1/* 2 * unbwt.c for libdivsufsort 3 * Copyright (c) 2003-2008 Yuta Mori All Rights Reserved. 4 * 5 * Permission is hereby granted, free of charge, to any person 6 * obtaining a copy of this software and associated documentation 7 * files (the "Software"), to deal in the Software without 8 * restriction, including without limitation the rights to use, 9 * copy, modify, merge, publish, distribute, sublicense, and/or sell 10 * copies of the Software, and to permit persons to whom the 11 * Software is furnished to do so, subject to the following 12 * conditions: 13 * 14 * The above copyright notice and this permission notice shall be 15 * included in all copies or substantial portions of the Software. 16 * 17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 18 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES 19 * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 20 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT 21 * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, 22 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 23 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 24 * OTHER DEALINGS IN THE SOFTWARE. 25 */ 26 27#if HAVE_CONFIG_H 28# include "config.h" 29#endif 30#include <stdio.h> 31#if HAVE_STRING_H 32# include <string.h> 33#endif 34#if HAVE_STDLIB_H 35# include <stdlib.h> 36#endif 37#if HAVE_MEMORY_H 38# include <memory.h> 39#endif 40#if HAVE_STDDEF_H 41# include <stddef.h> 42#endif 43#if HAVE_STRINGS_H 44# include <strings.h> 45#endif 46#if HAVE_SYS_TYPES_H 47# include <sys/types.h> 48#endif 49#if HAVE_IO_H && HAVE_FCNTL_H 50# include <io.h> 51# include <fcntl.h> 52#endif 53#include <time.h> 54#include <divsufsort.h> 55#include "lfs.h" 56 57 58static 59size_t 60read_int(FILE *fp, saidx_t *n) { 61 unsigned char c[4]; 62 size_t m = fread(c, sizeof(unsigned char), 4, fp); 63 if(m == 4) { 64 *n = (c[0] << 0) | (c[1] << 8) | 65 (c[2] << 16) | (c[3] << 24); 66 } 67 return m; 68} 69 70static 71void 72print_help(const char *progname, int status) { 73 fprintf(stderr, 74 "unbwt, an inverse burrows-wheeler transform program, version %s.\n", 75 divsufsort_version()); 76 fprintf(stderr, "usage: %s INFILE OUTFILE\n\n", progname); 77 exit(status); 78} 79 80int 81main(int argc, const char *argv[]) { 82 FILE *fp, *ofp; 83 const char *fname, *ofname; 84 sauchar_t *T; 85 saidx_t *A; 86 LFS_OFF_T n; 87 size_t m; 88 saidx_t pidx; 89 clock_t start, finish; 90 saint_t err, blocksize, needclose = 3; 91 92 /* Check arguments. */ 93 if((argc == 1) || 94 (strcmp(argv[1], "-h") == 0) || 95 (strcmp(argv[1], "--help") == 0)) { print_help(argv[0], EXIT_SUCCESS); } 96 if(argc != 3) { print_help(argv[0], EXIT_FAILURE); } 97 98 /* Open a file for reading. */ 99 if(strcmp(argv[1], "-") != 0) { 100#if HAVE_FOPEN_S 101 if(fopen_s(&fp, fname = argv[1], "rb") != 0) { 102#else 103 if((fp = LFS_FOPEN(fname = argv[1], "rb")) == NULL) { 104#endif 105 fprintf(stderr, "%s: Cannot open file `%s': ", argv[0], fname); 106 perror(NULL); 107 exit(EXIT_FAILURE); 108 } 109 } else { 110#if HAVE__SETMODE && HAVE__FILENO 111 if(_setmode(_fileno(stdin), _O_BINARY) == -1) { 112 fprintf(stderr, "%s: Cannot set mode: ", argv[0]); 113 perror(NULL); 114 exit(EXIT_FAILURE); 115 } 116#endif 117 fp = stdin; 118 fname = "stdin"; 119 needclose ^= 1; 120 } 121 122 /* Open a file for writing. */ 123 if(strcmp(argv[2], "-") != 0) { 124#if HAVE_FOPEN_S 125 if(fopen_s(&ofp, ofname = argv[2], "wb") != 0) { 126#else 127 if((ofp = LFS_FOPEN(ofname = argv[2], "wb")) == NULL) { 128#endif 129 fprintf(stderr, "%s: Cannot open file `%s': ", argv[0], ofname); 130 perror(NULL); 131 exit(EXIT_FAILURE); 132 } 133 } else { 134#if HAVE__SETMODE && HAVE__FILENO 135 if(_setmode(_fileno(stdout), _O_BINARY) == -1) { 136 fprintf(stderr, "%s: Cannot set mode: ", argv[0]); 137 perror(NULL); 138 exit(EXIT_FAILURE); 139 } 140#endif 141 ofp = stdout; 142 ofname = "stdout"; 143 needclose ^= 2; 144 } 145 146 /* Read the blocksize. */ 147 if(read_int(fp, &blocksize) != 4) { 148 fprintf(stderr, "%s: Cannot read from `%s': ", argv[0], fname); 149 perror(NULL); 150 exit(EXIT_FAILURE); 151 } 152 153 /* Allocate 5blocksize bytes of memory. */ 154 T = (sauchar_t *)malloc(blocksize * sizeof(sauchar_t)); 155 A = (saidx_t *)malloc(blocksize * sizeof(saidx_t)); 156 if((T == NULL) || (A == NULL)) { 157 fprintf(stderr, "%s: Cannot allocate memory.\n", argv[0]); 158 exit(EXIT_FAILURE); 159 } 160 161 fprintf(stderr, "UnBWT (blocksize %" PRIdSAINT_T ") ... ", blocksize); 162 start = clock(); 163 for(n = 0; (m = read_int(fp, &pidx)) != 0; n += m) { 164 /* Read blocksize bytes of data. */ 165 if((m != 4) || ((m = fread(T, sizeof(sauchar_t), blocksize, fp)) == 0)) { 166 fprintf(stderr, "%s: %s `%s': ", 167 argv[0], 168 (ferror(fp) || !feof(fp)) ? "Cannot read from" : "Unexpected EOF in", 169 fname); 170 perror(NULL); 171 exit(EXIT_FAILURE); 172 } 173 174 /* Inverse Burrows-Wheeler Transform. */ 175 if((err = inverse_bw_transform(T, T, A, m, pidx)) != 0) { 176 fprintf(stderr, "%s (reverseBWT): %s.\n", 177 argv[0], 178 (err == -1) ? "Invalid data" : "Cannot allocate memory"); 179 exit(EXIT_FAILURE); 180 } 181 182 /* Write m bytes of data. */ 183 if(fwrite(T, sizeof(sauchar_t), m, ofp) != m) { 184 fprintf(stderr, "%s: Cannot write to `%s': ", argv[0], ofname); 185 perror(NULL); 186 exit(EXIT_FAILURE); 187 } 188 } 189 if(ferror(fp)) { 190 fprintf(stderr, "%s: Cannot read from `%s': ", argv[0], fname); 191 perror(NULL); 192 exit(EXIT_FAILURE); 193 } 194 finish = clock(); 195 fprintf(stderr, "%" PRIdOFF_T " bytes: %.4f sec\n", 196 n, (double)(finish - start) / (double)CLOCKS_PER_SEC); 197 198 /* Close files */ 199 if(needclose & 1) { fclose(fp); } 200 if(needclose & 2) { fclose(ofp); } 201 202 /* Deallocate memory. */ 203 free(A); 204 free(T); 205 206 return 0; 207} 208