view xdwsort.cpp @ 1:9341384c2785

added xdwsort.
author pyon@macmini
date Mon, 16 Oct 2017 20:51:59 +0900
parents
children edfa39292d78
line wrap: on
line source

/* Makefile
debug: xdwsort.cpp
	#rm -rf tempXXXX
	#cls
	gcc -g -O0 -I. xdwsort.cpp xdwapi.lib
	#date
	#./a.exe target.xdw
	#date

release: xdwsort.cpp
	gcc -I. xdwsort.cpp xdwapi.lib -static -o xdwsort.exe
	strip xdwsort.exe

clean:
	rm -rf tempXXXX
*/

#include <stdio.h>
#include <string.h>
#include <stdlib.h>
#include <time.h>
#include <glob.h>
#include <io.h>
#include <windows.h>
#include <xdw_api.h>

#define MAXCOL  1024
#define MAXLINE 9999
#define BLOCKSZ   64

void print_error( int code ) {
	fprintf( stderr, "Error code : %d\n", code );
	switch ( code ) {
	case XDW_E_NOT_INSTALLED:
		fprintf( stderr, "DocuWorksがインストールされていません。" );
		break;
	case XDW_E_FILE_NOT_FOUND:
		fprintf( stderr, "指定されたファイルが見つかりません。" );
		break;
	case XDW_E_FILE_EXISTS:
		fprintf( stderr, "指定されたファイルはすでに存在します。" );
		break;
	case XDW_E_ACCESSDENIED:
	case XDW_E_INVALID_NAME:
	case XDW_E_BAD_NETPATH:
		fprintf( stderr, "指定されたファイルを開くことができません。" );
		break;
	case XDW_E_BAD_FORMAT:
		fprintf( stderr, "指定されたファイルは正しいフォーマットではありません。" );
		break;
	case XDW_E_INVALID_ACCESS:
		fprintf( stderr, "指定された操作をする権利がありません。" );
		break;
	default:
		fprintf( stderr, "エラーが発生しました。" );
		break;
	}
}

void print_now( char *msg ) {
   time_t now = time( NULL );
   struct tm *ts = localtime( &now );

   char buf[80];
   strftime( buf, sizeof( buf ), "%H:%M:%S %Z", ts );
   printf( "%s\t%s\n", buf, msg );
}

int main( int argc, char* argv[] ) {

	/* オプションの解析 */
	char prog[128];
	strcpy( prog, argv[0] );

	int pnow = 0;
	char c;
	while ( --argc > 0 && ( *++argv )[0] == '-' ) {
		while ( c = *++argv[0] ) {
			switch ( c ) {
				case 'v':
					pnow = 1;
					print_now( "start." );
					break;
				case 'l':	/* now writing... */
					break;
				default:
					printf("error: illegal option '%c'.\n", c );
					exit( 1 );
			}
		}
	}

	if ( argc < 1 ) {
		fprintf( stderr, "%s infile\n", prog );
		fprintf( stderr, "%s -v infile\n", prog );
		exit( 1 );
	}

	/* ソートリストの取り込み */
	if ( pnow ) print_now( "reading sort-list." );

	FILE *fp;
	char buf[ MAXCOL ];
	char *sl = (char*)malloc( MAXLINE * sizeof( char ) * MAXCOL );

	if ( sl == NULL ) {
		fprintf( stderr, "can't allocate memory\n" );
		exit( 1 );
	}

	if ( ( fp = fopen( "sort.list", "r" ) ) == NULL ) {
		fprintf( stderr, "%s: can't open file [sort.list]\n", argv[0] );
		exit ( 1 );
	}

	char *p;
	int slN = 0;
	while ( fgets( buf, sizeof buf, fp ) ) {
		if ( !strncmp( buf, "#",  1 ) ) continue;
		if ( !strncmp( buf, "//", 2 ) ) continue;
		if ( !strcmp( buf, "\n" )     ) continue;

		if ( ( p = strchr( buf, '\n' ) ) != NULL ) {
			*p = '\0';
		}
		strncpy( &sl[ slN * MAXCOL ], buf, MAXCOL );
		slN++;
	}
	fclose( fp );
	/*
	for ( int j = 0; j < slN; j++ ) {
		printf( "%d : %s\n", j, &sl[ j * MAXCOL ] );
	}
	exit( 0 );
	*/

	/* 本処理:並び順を決定しつつ抽出作業 */
	if ( pnow ) print_now( "analizing xdw-file." );

	char in_path[ _MAX_PATH ];
	_fullpath( in_path, argv[0], _MAX_PATH );

	int api_result = 0;

	XDW_DOCUMENT_HANDLE h = NULL; // 文書ハンドルを開く
	XDW_OPEN_MODE_EX mode = {
		sizeof( XDW_OPEN_MODE_EX ), XDW_OPEN_READONLY, XDW_AUTH_NODIALOGUE
	};
	api_result = XDW_OpenDocumentHandle( in_path, &h, (XDW_OPEN_MODE*)&mode );
	if ( api_result < 0 ) {
		print_error( api_result );
		return 0;
	}

	XDW_DOCUMENT_INFO info = { sizeof( XDW_DOCUMENT_INFO ), 0, 0, 0 }; // 総ページ数を得る
	XDW_GetDocumentInformation( h, &info );
	int last_page = info.nPages;

	int *table = (int*)malloc( sizeof( int ) * last_page );
	for ( int p = 0; p < last_page; p++ ) {
		*( table + p ) = 9999;
	}
	int index = 0;
	XDW_FOUND_HANDLE pFoundHandle = NULL;
	for ( int i = 0; i < slN; i++ ) {
		for ( int p = 0; p < last_page; p++ ) {
			if ( *( table + p ) != 9999 ) continue;
			api_result = XDW_FindTextInPage( h, p + 1, &sl[ i * MAXCOL ], NULL, &pFoundHandle, NULL );
			if ( api_result < 0 ) {
				print_error( api_result );
				exit( 1 );
			}
			if ( pFoundHandle != NULL ) {
				*( table + p ) = ++index;
				//printf( "found : %s at %d\n", &sl[ i * MAXCOL ], p + 1 );
				pFoundHandle = NULL;
			}
		}
	}
	free( sl );

	if ( pnow ) print_now( "extracting pages." );
	mkdir( "tempXXXX" );
	for ( int p = 0; p < last_page; p++ ) {
		if ( *( table + p ) == 9999 ) {
			*( table + p ) = ++index;
		}
		//printf( "%d\n", *( table + p ) );
		sprintf( buf, "tempXXXX/%04d.xdw", *( table + p ) );
		_fullpath( in_path, buf, _MAX_PATH );
		api_result = XDW_GetPage( h, p + 1, in_path, NULL );
		if ( api_result < 0 ) {
			print_error( api_result );
			exit( 1 );
		}
	}
	free( table );

	XDW_CloseDocumentHandle( h, NULL ); // 文書ハンドルを閉じる

	/* マージ */
	if ( pnow ) print_now( "merging pages." );

	/* ブロック版 */
	char *blk_path = (char*)malloc( BLOCKSZ * sizeof( char ) * _MAX_PATH );
	const char **blk_path_addr = (const char**)malloc( ( last_page / BLOCKSZ + 1 ) * sizeof( char* ) * _MAX_PATH );

	int bn = 0;
	// ブロック毎の処理
	for ( int p = 0, m = 0; p < last_page; p++ ) {
		m = p % BLOCKSZ;
		if ( m == 0 && p > 0 ) {
			sprintf( buf, "tempXXXX/b%04d.xdw", ++bn );
			_fullpath( in_path, buf, _MAX_PATH );
			api_result = XDW_MergeXdwFiles( blk_path_addr, BLOCKSZ, in_path, NULL );
			if ( api_result < 0 ) {
				print_error( api_result );
				exit( 1 );
			}
		} 
		sprintf( buf, "tempXXXX/%04d.xdw", p + 1 );
		_fullpath( in_path, buf, _MAX_PATH );
		strncpy( &blk_path[ m * _MAX_PATH ], buf, _MAX_PATH );
		blk_path_addr[m] = &blk_path[ m * _MAX_PATH ];
	}
	if ( last_page % BLOCKSZ != 0 ) {
		sprintf( buf, "tempXXXX/b%04d.xdw", ++bn );
		_fullpath( in_path, buf, _MAX_PATH );
		api_result = XDW_MergeXdwFiles( blk_path_addr, last_page % BLOCKSZ, in_path, NULL );
		if ( api_result < 0 ) {
			print_error( api_result );
			exit( 1 );
		}
	}

	// ブロックをまとめる
	for ( int b = 0; b < bn; b++ ) {
		sprintf( buf, "tempXXXX/b%04d.xdw", b + 1 );
		_fullpath( in_path, buf, _MAX_PATH );
		strncpy( &blk_path[ b * _MAX_PATH ], buf, _MAX_PATH );
		blk_path_addr[b] = &blk_path[ b * _MAX_PATH ];
	}
	_fullpath( in_path, "tempXXXX/temp.xdw", _MAX_PATH );
	remove( in_path );
	api_result = XDW_MergeXdwFiles( blk_path_addr, bn, in_path, NULL );
	if ( api_result < 0 ) {
		print_error( api_result );
		exit( 1 );
	}

	free( blk_path );
	free( blk_path_addr );

	/* ふるぺーじばん ok
	char *buf_path = (char*)malloc( last_page * sizeof( char ) * _MAX_PATH );
	const char **buf_path_addr = (const char**)malloc( last_page * sizeof( char* ) * _MAX_PATH );
	if ( buf_path == NULL || buf_path_addr == NULL ) {
		fprintf( stderr, "can't allocate memory\n" );
		exit( 1 );
	}

	for ( int p = 0; p < last_page; p++ ) {
		sprintf( buf, "tempXXXX/%04d.xdw", p + 1 );
		_fullpath( buf, buf, _MAX_PATH );
		strncpy( &buf_path[ p * _MAX_PATH ], buf, _MAX_PATH );
		//printf( "%d %x %s\n", p, &buf_path[ p * _MAX_PATH ], &buf_path[ p * _MAX_PATH ] );
		buf_path_addr[p] = &buf_path[ p * _MAX_PATH ];
	}

	_fullpath( in_path, "tempXXXX/temp.xdw", _MAX_PATH );
	remove( in_path );
	api_result = XDW_MergeXdwFiles( buf_path_addr, last_page, in_path, NULL );
	if ( api_result < 0 ) {
		print_error( api_result );
		exit( 1 );
	}

	free( buf_path );
	free( buf_path_addr );
	*/

	/* 最適化 */
	if ( pnow ) print_now( "optimizing." );
	char out_path[ _MAX_PATH ];
	_fullpath( out_path, "out.xdw", _MAX_PATH );
	remove( out_path );
	api_result = XDW_OptimizeDocument( in_path, out_path, NULL );
	if ( api_result < 0 ) {
		print_error( api_result );
		exit( 1 );
	}

	/* 後処理 */
	if ( pnow ) print_now( "cleaning." );
	glob_t globbuf;
    glob( "tempXXXX/*.*", 0, NULL, &globbuf );
    for ( int i = 0; i < globbuf.gl_pathc; i++ ) {
		_fullpath( in_path, globbuf.gl_pathv[i], _MAX_PATH );
		remove( in_path );
    }
    globfree( &globbuf );
	rmdir( "tempXXXX" );

	if ( pnow ) print_now( "done." );
	return 0;
}