/***************************************************************************** bmptopnm.c ****************************************************************************** Bmptopnm - Converts from a Microsoft Windows or OS/2 .BMP file to a PBM, PGM, or PPM file. This program was formerly called Bmptoppm (and generated only PPM output). The name was changed in March 2002. Copyright (C) 1992 by David W. Sanderson. Permission to use, copy, modify, and distribute this software and its documentation for any purpose and without fee is hereby granted, provided that the above copyright notice appear in all copies and that both that copyright notice and this permission notice appear in supporting documentation. This software is provided "as is" without express or implied warranty. Note: From mid-2003 to mid-2007, this program would crash on any 16 bit BMP without transparency and no one reported it. Before that, it refused to even try to read a 16 bit BMP. I conclude that essentially nobody is using 16 bit BMP. *****************************************************************************/ #include #include #include #include "pm_c_util.h" #include "mallocvar.h" #include "shhopt.h" #include "nstring.h" #include "pnm.h" #include "bmp.h" static xelval const bmpMaxval = 255; /* The maxval for intensity values in a BMP image -- either in a truecolor raster or in a colormap */ enum rowOrder {BOTTOMUP, TOPDOWN}; struct bitPosition { /* mask and shift count to describe a set of bits in a binary value. Example: if 16 bits are laid out as XRRRRRGGGGGBBBBB then the shift count for the R component is 10 and the mask is 0000000000011111. A 'mask' of zero denotes absence of any bits; e.g. in the example above, the mask for the transparency component is zero because there is no transparency component . 'shift' is arbitrary in that case. */ unsigned int shift; /* How many bits right you have to shift the value to get the subject bits in the least significant bit positions. */ unsigned int mask; /* Has one bits in positions where the subject bits are after shifting. */ }; struct pixelformat { /* The format of a pixel representation from the raster. i.e. which bits apply to red, green, blue, and transparency */ struct bitPosition red; struct bitPosition blu; struct bitPosition grn; struct bitPosition trn; bool conventionalBgr; /* This means that the above bit positions are just the conventional BGR format -- one byte Blue, one byte Green, one byte Red, no alpha. Though it's totally redundant with the members above, this member speeds up computation: We've never actually seen a BMP file that doesn't use conventional BGR, and it doesn't require any masking or shifting at all to interpret. */ }; typedef struct { /* These are all encodings of floating point */ unsigned long x; unsigned long y; unsigned long z; } cieXyz; typedef struct { cieXyz red; cieXyz grn; cieXyz blu; } cieXyzTriple; struct bmpInfoHeader { enum rowOrder rowOrder; unsigned int cols; unsigned int rows; unsigned int cBitCount; /* Number of bits in the BMP file that each pixel occupies. */ enum bmpClass class; bool bitFields; /* The raster values are arranged in arbitrary bit fields as described by the "mask" values in the header, rather than fixed formats. */ unsigned int cmapSize; /* Size in bytes of the colormap (palette) in the BMP file. Zero means there is no colormap. */ unsigned int imageSize; /* Size in bytes of the image data. We only reference this when the image is compressed. */ unsigned short cPlanes; BMPCompType compression; struct pixelformat pixelformat; cieXyzTriple endPoints; }; struct cmdlineInfo { /* All the information the user supplied in the command line, in a form easy for the program to use. */ const char * inputFileName; unsigned int verbose; }; static const char * ifname; static void parseCommandLine(int argc, const char ** argv, struct cmdlineInfo * const cmdlineP) { /*---------------------------------------------------------------------------- Note that the file spec array we return is stored in the storage that was passed to us as the argv array. -----------------------------------------------------------------------------*/ optEntry * option_def; /* Used by OPTENT3 */ optStruct3 opt; unsigned int option_def_index; MALLOCARRAY_NOFAIL(option_def, 100); option_def_index = 0; /* incremented by OPTENT3 */ OPTENT3(0, "verbose", OPT_FLAG, NULL, &cmdlineP->verbose, 0); opt.opt_table = option_def; opt.short_allowed = FALSE; /* We have no short (old-fashioned) options */ opt.allowNegNum = FALSE; /* We have no parms that are negative numbers */ pm_optParseOptions4(&argc, argv, opt, sizeof(opt), 0); /* Uses and sets argc, argv, and some of *cmdlineP and others. */ if (argc-1 == 0) cmdlineP->inputFileName = "-"; else if (argc-1 != 1) pm_error("Program takes zero or one argument (filename). You " "specified %d", argc-1); else cmdlineP->inputFileName = argv[1]; } static const char er_read[] = "%s: read error"; static int GetByte(FILE * const fp) { int v; if ((v = getc(fp)) == EOF) pm_error(er_read, ifname); return v; } static short GetShort(FILE * const fp) { short v; if (pm_readlittleshort(fp, &v) == -1) pm_error(er_read, ifname); return v; } static short GetBigShort(FILE * const fp) { short v; if (pm_readbigshort(fp, &v) == -1) pm_error(er_read, ifname); return v; } static long GetLong(FILE * const fp) { long v; if (pm_readlittlelong(fp, &v) == -1) pm_error(er_read, ifname); return v; } static cieXyz GetCieXyz(FILE * const ifP) { cieXyz retval; retval.x = GetLong(ifP); retval.y = GetLong(ifP); retval.z = GetLong(ifP); return retval; } static cieXyzTriple GetCieXyzTriple(FILE * const ifP) { cieXyzTriple retval; retval.red = GetCieXyz(ifP); retval.grn = GetCieXyz(ifP); retval.blu = GetCieXyz(ifP); return retval; } static struct pixelformat defaultPixelformat(unsigned int const bitCount) { struct pixelformat retval; switch (bitCount) { case 16: /* This layout is sometimes called "RGB555". A document from Microsoft says this is the default (when the "compression" field of the header says COMP_BITFIELDS). */ retval.conventionalBgr = FALSE; retval.red.shift = 10; retval.grn.shift = 5; retval.blu.shift = 0; retval.trn.shift = 0; retval.red.mask = 0x1f; /* 5 bits */ retval.grn.mask = 0x1f; /* 5 bits */ retval.blu.mask = 0x1f; /* 5 bits */ retval.trn.mask = 0; break; case 24: case 32: retval.conventionalBgr = TRUE; retval.red.shift = 16; retval.grn.shift = 8; retval.blu.shift = 0; retval.trn.shift = 0; retval.red.mask = 0xff; /* 8 bits */ retval.grn.mask = 0xff; /* 8 bits */ retval.blu.mask = 0xff; /* 8 bits */ retval.trn.mask = 0; break; default: /* colormapped - masks are undefined */ break; } return retval; } static void readOffBytes(FILE * const fp, unsigned int const nbytes) { /*---------------------------------------------------------------------------- Read 'nbytes' from file 'fp'. Abort program if read error. -----------------------------------------------------------------------------*/ int i; for(i = 0; i < nbytes; ++i) { int rc; rc = getc(fp); if (rc == EOF) pm_error(er_read, ifname); } } static void bmpReadfileheader(FILE * const ifP, unsigned int * const bytesReadP, unsigned int * const offBitsP) { unsigned long offBits; if (GetByte(ifP) != 'B') pm_error("'%s' is not a BMP file. (It doesn't start with 'BM')", ifname); if (GetByte(ifP) != 'M') pm_error("'%s' is not a BMP file. (It doesn't start with 'BM')", ifname); /* fileSize = */ GetLong(ifP); /* This is not always reliable. */ /* xHotSpot = */ GetShort(ifP); /* yHotSpot = */ GetShort(ifP); offBits = GetLong(ifP); *offBitsP = offBits; assert(BMPlenfileheader() == 14); *bytesReadP = 14; } static void readOs2InfoHeaderRest(FILE * const ifP, struct bmpInfoHeader * const headerP) { /*---------------------------------------------------------------------------- Read the rest of the info header, after its size field, of an OS2 BMP from *ifP. Add the information from it to *headerP, in particular these members: cols rows rowOrder cPlanes cBitCount cmapSize pixelformat compression -----------------------------------------------------------------------------*/ unsigned short colsField, rowsField; unsigned short planesField, bitCountField; pm_readlittleshortu(ifP, &colsField); if (colsField == 0) pm_error("Invalid BMP file: says width is zero"); else headerP->cols = colsField; pm_readlittleshortu(ifP, &rowsField); if (rowsField == 0) pm_error("Invalid BMP file: says height is zero"); else headerP->rows = rowsField; headerP->rowOrder = BOTTOMUP; pm_readlittleshortu(ifP, &planesField); headerP->cPlanes = planesField; pm_readlittleshortu(ifP, &bitCountField); headerP->cBitCount = bitCountField; /* I actually don't know if the OS/2 BMP format allows cBitCount > 8 or if it does, what it means, but ppmtobmp creates such BMPs, more or less as a byproduct of creating the same for Windows BMP, so we interpret cBitCount > 8 the same as for Windows. */ if (headerP->cBitCount <= 8) headerP->cmapSize = 1 << headerP->cBitCount; else if (headerP->cBitCount == 24) headerP->cmapSize = 0; /* There is a 16 bit truecolor format, but we don't know how the bits are divided among red, green, and blue, so we can't handle it. */ else pm_error("Unrecognized bits per pixel in OS/2 BMP file header: %d", headerP->cBitCount); headerP->pixelformat = defaultPixelformat(headerP->cBitCount); headerP->compression = BMPCOMP_RGB; } static void validateCompression(unsigned long const compression, enum rowOrder const rowOrder, unsigned int const cBitCount) { if (compression != BMPCOMP_RGB && compression != BMPCOMP_BITFIELDS && compression != BMPCOMP_RLE4 && compression != BMPCOMP_RLE8) pm_error("Input has unknown encoding. " "Compression type code = %ld. The only ones we know " "are RGB (%u), BITFIELDS (%u), " "RLE4 (%u), and RLE8 (%u)", compression, BMPCOMP_RGB, BMPCOMP_BITFIELDS, BMPCOMP_RLE4, BMPCOMP_RLE8); if ((compression == BMPCOMP_RLE4 || compression == BMPCOMP_RLE8) && rowOrder == TOPDOWN ) pm_error("Invalid BMP header. Claims image is top-down and also " "compressed, which is an impossible combination."); if ((compression == BMPCOMP_RLE4 && cBitCount !=4 ) || (compression == BMPCOMP_RLE8 && cBitCount !=8 )) pm_error("Invalid BMP header. " "Compression type (%s) disagrees with " "number of bits per pixel (%u).", compression == BMPCOMP_RLE4 ? "RLE4" : "RLE8", cBitCount); } static void readWindowsBasic40ByteInfoHeader(FILE * const ifP, struct bmpInfoHeader * const headerP) { /*---------------------------------------------------------------------------- Read from the file stream 'ifP' the basic BMP Info header. This does not include any Info header extension. The Info header is the data that comes after the BMP file header. Return the information from the info header as *headerP. -----------------------------------------------------------------------------*/ int colorsused; /* ColorsUsed value from header */ unsigned short planesField, bitCountField; int32_t colsField; pm_readlittlelong2(ifP, &colsField); if (colsField == 0) pm_error("Invalid BMP file: says width is zero"); else if (colsField < 0) pm_error("Invalid BMP file: says width is negative (%d)", colsField); else headerP->cols = (unsigned int)colsField; { long const cy = GetLong(ifP); if (cy == 0) pm_error("Invalid BMP file: says height is zero"); if (cy < 0) { headerP->rowOrder = TOPDOWN; headerP->rows = - cy; } else { headerP->rowOrder = BOTTOMUP; headerP->rows = cy; } } pm_readlittleshortu(ifP, &planesField); headerP->cPlanes = planesField; pm_readlittleshortu(ifP, &bitCountField); headerP->cBitCount = bitCountField; { unsigned long int const compression = GetLong(ifP); validateCompression(compression, headerP->rowOrder, headerP->cBitCount); headerP->bitFields = (compression == BMPCOMP_BITFIELDS); headerP->compression = compression; } /* And read the rest of the junk in the 40 byte header */ headerP->imageSize = GetLong(ifP); /* ImageSize */ GetLong(ifP); /* XpixelsPerMeter */ GetLong(ifP); /* YpixelsPerMeter */ colorsused = GetLong(ifP); /* ColorsUsed */ /* See comments in bmp.h for info about the definition of the following word and its relationship to the color map size (headerP->cmapSize). */ /* colorsimportant = */ GetLong(ifP); /* ColorsImportant */ if (headerP->cBitCount <= 8) { if (colorsused != 0) { if (colorsused > 1 << headerP->cBitCount) pm_error("Invalid BMP header. Says %u bits per pixel, " "but %d colors used", headerP->cBitCount, colorsused); else if (colorsused == 1 && headerP->cBitCount == 1) { pm_message("Abnormal BMP header. Says 1 bit per pixel. " "Should have 2 colors, but says only 1 color used. " ); headerP->cmapSize = colorsused; } else headerP->cmapSize = colorsused; } else headerP->cmapSize = 1 << headerP->cBitCount; } else if (headerP->cBitCount == 24 || headerP->cBitCount == 16 || headerP->cBitCount == 32) headerP->cmapSize = 0; else pm_error("Unrecognized bits per pixel in Windows BMP file header: %d", headerP->cBitCount); } static unsigned int lsbZeroCount(unsigned int const mask) /*---------------------------------------------------------------------------- Return the number of consecutive zeroes in the mask 'mask', starting with the least significant bit and going up. E.g. for 0x20, it would be 5. Use GCC built-in when available. -----------------------------------------------------------------------------*/ #if HAVE_GCC_BITCOUNT { return ( mask==0 ? sizeof(mask)*8 : __builtin_ctz(mask) ); } #else { unsigned int i=0; while (((mask >> i) & 0x1) == 0 && i < sizeof(mask)*8) ++i; return i; } #endif static struct bitPosition bitPositionFromMask(long const bmpMask) { struct bitPosition retval; retval.shift = lsbZeroCount(bmpMask); retval.mask = bmpMask >> retval.shift; return retval; } static void computeConventionalBgr(struct pixelformat * const fP, unsigned int const bitCount) { switch (bitCount) { case 24: fP->conventionalBgr = fP->red.shift == 0 && fP->red.mask == 0xFF && fP->grn.shift == 8 && fP->grn.mask == 0xFF && fP->blu.shift == 16 && fP->blu.mask == 0xFF && fP->trn.mask == 0 ; break; case 32: fP->conventionalBgr = fP->red.shift == 8 && fP->red.mask == 0xFF && fP->grn.shift == 16 && fP->grn.mask == 0xFF && fP->blu.shift == 24 && fP->blu.mask == 0xFF && fP->trn.mask == 0 ; break; default: fP->conventionalBgr = FALSE; } } static void readV4InfoHeaderExtension(FILE * const ifP, struct bmpInfoHeader * const headerP, unsigned int * const bytesReadP) { unsigned long redMsk, grnMsk, bluMsk, trnMsk; redMsk = GetLong(ifP); grnMsk = GetLong(ifP); bluMsk = GetLong(ifP); trnMsk = GetLong(ifP); if (headerP->bitFields) { /* A document from Microsoft says on Windows 95 there is no transparency plane and (red, green, blue) must be either (5,5,5) or (5,6,5) for 16 bit and (8,8,8) for 32 bit. It calls these RGB555, RGB565, RGB888. */ headerP->pixelformat.red = bitPositionFromMask(redMsk); headerP->pixelformat.grn = bitPositionFromMask(grnMsk); headerP->pixelformat.blu = bitPositionFromMask(bluMsk); headerP->pixelformat.trn = bitPositionFromMask(trnMsk); computeConventionalBgr(&headerP->pixelformat, headerP->cBitCount); } else headerP->pixelformat = defaultPixelformat(headerP->cBitCount); GetLong(ifP); /* Color space */ headerP->endPoints = GetCieXyzTriple(ifP); /* 36 bytes */ GetLong(ifP); /* GammaRed */ GetLong(ifP); /* GammaGreen */ GetLong(ifP); /* GammaBlue */ *bytesReadP = 68; } static void readV5InfoHeaderExtension(FILE * const ifP, struct bmpInfoHeader * const headerP, unsigned int * const bytesReadP) { GetLong(ifP); /* Intent */ GetLong(ifP); /* ProfileData */ GetLong(ifP); /* ProfileSize */ GetLong(ifP); /* Reserved */ *bytesReadP = 16; } static void defaultV4InfoHeaderExtension(struct bmpInfoHeader * const headerP) { headerP->pixelformat = defaultPixelformat(headerP->cBitCount); } static void readWindowsInfoHeaderRest(FILE * const ifP, unsigned int const cInfoHeaderSize, struct bmpInfoHeader * const headerP) { /*---------------------------------------------------------------------------- Read the rest of the info header, after the length field, of a Windows BMP from *ifP. 'cInfoHeaderSize' is the size of the info header, not counting its size field. Note that besides telling us how much data to read, this also implies which of the three major formats the data is in. Add the information from it to *headerP, in particular these members: cols rows rowOrder cPlanes cBitCount bitFields compression imageSize cmapSize pixelformat endPoints -----------------------------------------------------------------------------*/ /* There are 3 major formats of Windows BMP, identified by the 3 info header lengths. The original one is 40 bytes. The "V4 header" is 108 bytes and was new with Windows 95 and NT 4.0. The "V5 header" is 124 bytes and was new with Windows 98 and Windows 2000. */ unsigned int bytesRead; readWindowsBasic40ByteInfoHeader(ifP, headerP); bytesRead = 40; if (cInfoHeaderSize >= BMP_HDRLEN_WIN_V4) { unsigned int v4BytesRead; readV4InfoHeaderExtension(ifP, headerP, &v4BytesRead); bytesRead += v4BytesRead; assert(bytesRead == BMP_HDRLEN_WIN_V4); } else defaultV4InfoHeaderExtension(headerP); if (cInfoHeaderSize >= BMP_HDRLEN_WIN_V5) { unsigned int v5BytesRead; readV5InfoHeaderExtension(ifP, headerP, &v5BytesRead); bytesRead += v5BytesRead; assert(bytesRead == BMP_HDRLEN_WIN_V5); } for (; bytesRead < cInfoHeaderSize;) { GetByte(ifP); ++bytesRead; } assert(bytesRead == cInfoHeaderSize); } static void bmpReadinfoheader(FILE * const ifP, unsigned int * const bytesReadP, struct bmpInfoHeader * const headerP, const char ** const errorP) { unsigned int const cInfoHeaderSize = GetLong(ifP); const char * error; BMPdetermineclass(cInfoHeaderSize, &headerP->class, &error); if (error) { pm_asprintf(errorP, "Cannot determine the class of BMP from the " "info header size %u. %s", cInfoHeaderSize, error); pm_strfree(error); } else { switch (headerP->class) { case BMP_C_WIN_V1: case BMP_C_WIN_V2: case BMP_C_WIN_V3: case BMP_C_WIN_V4: case BMP_C_WIN_V5: readWindowsInfoHeaderRest(ifP, cInfoHeaderSize, headerP); break; case BMP_C_OS2_1x: case BMP_C_OS2_2x: readOs2InfoHeaderRest(ifP, headerP); break; } *errorP = NULL; *bytesReadP = cInfoHeaderSize; } /* Part of our anti-arithmetic overflow strategy is to make sure height and width always fit in 16 bits, so they can be multiplied together. This shouldn't be a problem, since they come from 16 bit fields in the BMP info header. */ assert(headerP->cols < (1<<16)); assert(headerP->rows < (1<<16)); } static void bmpReadColormap(FILE * const ifP, enum bmpClass const class, xel ** const colormapP, unsigned int const cmapSize, unsigned int * const bytesReadP) { /*---------------------------------------------------------------------------- Read the color map from the present position in the input BMP file *ifP. The map has 'cmapSize' entries in it. cmapSize == 0 means there is no color map. We return a color map as *colormapP. If there is no color map in the BMP, this is just an arbitrary color map. 'class' is the class of BMP image - Windows or OS/2. -----------------------------------------------------------------------------*/ xel * const colormap = pnm_allocrow(MAX(1, cmapSize)); unsigned int i; unsigned int bytesRead; for (i = 0, bytesRead = 0; i < cmapSize; ++i) { /* There is a document that says the bytes are ordered R,G,B,Z, but in practice it appears to be the following instead: */ unsigned int const b = GetByte(ifP); unsigned int const g = GetByte(ifP); unsigned int const r = GetByte(ifP); unsigned int j; PNM_ASSIGN(colormap[i], r, g, b); bytesRead += 3; for (j = 3; j < BMPlenrgb(class); ++j) { GetByte(ifP); bytesRead += 1; } } *colormapP = colormap; *bytesReadP = bytesRead; } static void extractBitFields(unsigned int const rasterval, struct pixelformat const pixelformat, pixval const maxval, pixval * const rP, pixval * const gP, pixval * const bP, pixval * const aP) { unsigned int const rbits = (rasterval >> pixelformat.red.shift) & pixelformat.red.mask; unsigned int const gbits = (rasterval >> pixelformat.grn.shift) & pixelformat.grn.mask; unsigned int const bbits = (rasterval >> pixelformat.blu.shift) & pixelformat.blu.mask; unsigned int const abits = (rasterval >> pixelformat.trn.shift) & pixelformat.trn.mask; *rP = pixelformat.red.mask > 0 ? (unsigned int) rbits * maxval / pixelformat.red.mask : 0; *gP = pixelformat.grn.mask > 0 ? (unsigned int) gbits * maxval / pixelformat.grn.mask : 0; *bP = pixelformat.blu.mask > 0 ? (unsigned int) bbits * maxval / pixelformat.blu.mask : 0; *aP = pixelformat.trn.mask > 0 ? (unsigned int) abits * maxval / pixelformat.trn.mask : 0; } static void convertRow16(unsigned char const bmprow[], xel xelrow[], int const cols, struct pixelformat const pixelformat) { /* It's truecolor. */ unsigned int col; unsigned int cursor; cursor = 0; for (col=0; col < cols; ++col) { unsigned short const rasterval = (unsigned short) bmprow[cursor+1] << 8 | bmprow[cursor+0]; pixval r, g, b, a; extractBitFields(rasterval, pixelformat, 255, &r, &g, &b, &a); PNM_ASSIGN(xelrow[col], r, g, b); cursor += 2; } } static void convertRow24(unsigned char const bmprow[], xel xelrow[], int const cols, struct pixelformat const pixelformat) { /* It's truecolor */ /* There is a document that gives a much different format for 24 bit BMPs. But this seems to be the de facto standard, and is, with a little ambiguity and contradiction resolved, defined in the Microsoft BMP spec. */ unsigned int col; unsigned int cursor; cursor = 0; for (col = 0; col < cols; ++col) { pixval r, g, b, a; if (pixelformat.conventionalBgr) { r = bmprow[cursor+2]; g = bmprow[cursor+1]; b = bmprow[cursor+0]; a = 0; } else { unsigned int const rasterval = (bmprow[cursor+0] << 16) + (bmprow[cursor+1] << 8) + (bmprow[cursor+2] << 0); extractBitFields(rasterval, pixelformat, 255, &r, &g, &b, &a); } PNM_ASSIGN(xelrow[col], r, g, b); cursor += 3; } } static void convertRow32(unsigned char const bmprow[], xel xelrow[], int const cols, struct pixelformat const pixelformat) { /* It's truecolor */ unsigned int col; unsigned int cursor; cursor = 0; for (col = 0; col < cols; ++col) { pixval r, g, b, a; if (pixelformat.conventionalBgr) { /* bmprow[cursor+3] is just padding */ r = bmprow[cursor+2]; g = bmprow[cursor+1]; b = bmprow[cursor+0]; a = 0; } else { unsigned int const rasterval = (bmprow[cursor+0] << 24) + (bmprow[cursor+1] << 16) + (bmprow[cursor+2] << 8) + (bmprow[cursor+3] << 0); extractBitFields(rasterval, pixelformat, 255, &r, &g, &b, &a); } PNM_ASSIGN(xelrow[col], bmprow[cursor+2], bmprow[cursor+1], bmprow[cursor+0]); cursor += 4; } } static void validateIndex(unsigned int const index, unsigned int const cmapSize ) { if (index >= cmapSize) pm_error("Error: invalid index to color palette."); } static void convertRow(unsigned char const bmprow[], xel xelrow[], int const cols, unsigned int const cBitCount, struct pixelformat const pixelformat, xel const colormap[], unsigned int const cmapSize ) { /*---------------------------------------------------------------------------- Convert a row in raw BMP raster format bmprow[] to a row of xels xelrow[]. Use maxval 255 for the output xels. The BMP image has 'cBitCount' bits per pixel. If the image is colormapped, colormap[] is the colormap (colormap[i] is the color with color index i). -----------------------------------------------------------------------------*/ if (cBitCount == 24) convertRow24(bmprow, xelrow, cols, pixelformat); else if (cBitCount == 16) convertRow16(bmprow, xelrow, cols, pixelformat); else if (cBitCount == 32) convertRow32(bmprow, xelrow, cols, pixelformat); else if (cBitCount == 8) { /* It's a whole byte colormap index */ unsigned int col; for (col = 0; col < cols; ++col) { unsigned int const index = bmprow[col]; validateIndex(index, cmapSize); xelrow[col] = colormap[index]; } } else if (cBitCount == 1 || cBitCount == 2 || cBitCount == 4) { /* It's a bit field color index */ unsigned char const mask = ( 1 << cBitCount ) - 1; unsigned int col; for (col = 0; col < cols; ++col) { unsigned int const cursor = (col*cBitCount)/8; unsigned int const shift = 8 - ((col*cBitCount) % 8) - cBitCount; unsigned int const index = (bmprow[cursor] & (mask << shift)) >> shift; validateIndex(index, cmapSize); xelrow[col] = colormap[index]; } } else { /* Every possible BMP bits per pixel is handled above */ assert(false); } } static unsigned char ** allocBmpRaster(unsigned int const rows, unsigned int const bytesPerRow) { unsigned int const storageSize = rows * sizeof(unsigned char *) + rows * bytesPerRow; unsigned char ** bmpRaster; unsigned int row; unsigned char * startOfRows; /* The raster array consists of an array of pointers to the rows followed by the rows of bytes, in a single allocated chunk of storage. */ if (UINT_MAX / (bytesPerRow + sizeof(unsigned char *)) < rows) pm_error("raster is ridiculously large."); bmpRaster = (unsigned char **) malloc(storageSize); if (bmpRaster == NULL) pm_error("Unable to allocate %u bytes for the BMP raster\n", storageSize); startOfRows = (unsigned char *)(bmpRaster + rows); for (row = 0; row < rows; ++row) bmpRaster[row] = startOfRows + row * bytesPerRow; return bmpRaster; } static void readrow(FILE * const ifP, unsigned int const row, unsigned int const bytesPerRow, unsigned char ** const bmpRaster, unsigned int * const bytesReadP) { size_t bytesRead; assert(bytesPerRow > 0); bytesRead = fread(bmpRaster[row], 1, bytesPerRow, ifP); if (bytesRead < bytesPerRow) { if (feof(ifP)) pm_error("End of file reading row %u of BMP raster.", row); else pm_error("Error reading BMP raster. Errno=%d (%s)", errno, strerror(errno)); } *bytesReadP += bytesRead; } static void nybbleAlign(unsigned char * const bytes, unsigned int const nybbleCt){ /*---------------------------------------------------------------------------- Shift the 'nybbleCt' nybbles of bytes[], after the first byte, one nybble toward the left, with the first of those nybble shifting into the right half of the first byte. Leave the left half of the first byte alone. Example: (Numbers in hex, 8 nybbles) 5? 13 7E 89 A1 becomes 51 37 E8 9A 10 -----------------------------------------------------------------------------*/ unsigned int const fullByteCt = (nybbleCt + 1) / 2; unsigned int i; bytes[0] >>= 4; for (i = 0; i < fullByteCt; ++i) bytes[i] = bytes[i] << 4 | bytes[i+1] >> 4; if (nybbleCt % 2 == 0) { /* There is a final right nybble. Shift it. */ bytes[fullByteCt] <<= 4; } } enum rleStatus { ABS_MODE, ENC_MODE, END_OF_ROW, END_OF_BMP, DELTA }; static enum rleStatus readRLEcode(FILE * const ifP, unsigned int * const cntP, unsigned char * const codeP) { unsigned short s; enum rleStatus retval; s = GetBigShort(ifP); if (s == 0) retval = END_OF_ROW; else if (s == 1) retval = END_OF_BMP; else if (s == 2) retval = DELTA; else if (s < 256) { if (cntP) *cntP = s & 0xff; retval = ABS_MODE; } else { if (cntP && codeP) { *cntP = (s >> 8) & 0xff; *codeP = s & 0xff; } retval = ENC_MODE; } return retval; } static void readrowRLE(FILE * const ifP, unsigned int const row, unsigned int const cols, bool const lastrow, BMPCompType const compression, unsigned char ** const bmpRaster, unsigned int * const bytesReadP) { bool const rle4 = (compression == BMPCOMP_RLE4); int const pixelsPerRowMargin = rle4 ? cols % 2 : 0; char const err_decode[] = "Error while decoding compressed BMP image. " "%s. Row: %u Pixel: %u" ; unsigned int totalBytesRead; unsigned int pixelsRead; /* There are RLE4 images with rows coded up to the byte boundary, resulting in each row one pixel larger than the column length stated in the BMP info header (header.cols) when the column length is odd. pixelsPerRowMargin is a "wart" to provide for this case. */ totalBytesRead = 0; /* Initial value */ pixelsRead = 0; /* Initial value */ while (true) { unsigned int n; /* decompressed bytes already read; current write point */ unsigned int cnt; unsigned char code; n = rle4 ? (pixelsRead + 1) / 2 : pixelsRead; switch (readRLEcode(ifP, &cnt, &code)) { case ENC_MODE: { unsigned int const byteCnt = rle4 ? (cnt + 1) /2 : cnt; unsigned int i; if (pixelsRead + cnt > cols + pixelsPerRowMargin) pm_error(err_decode, "Too many pixels in encoded mode", row, pixelsRead ); for (i = 0; i < byteCnt; ++i) bmpRaster[row][n+i] = code; if (rle4 && pixelsRead % 2 == 1) /* previous read ended odd */ nybbleAlign(&bmpRaster[row][n-1], cnt); pixelsRead += cnt; totalBytesRead += 2; } break; case ABS_MODE: { unsigned int cmpBytesRead; /* compressed bytes read */ /* align read-end to 16 bit boundary */ unsigned int const bytesToRead = rle4 ? (cnt + 3) / 4 * 2 : (cnt + 1) / 2 * 2; if (pixelsRead + cnt > cols + pixelsPerRowMargin) pm_error(err_decode, "Too many pixels in absolute mode", row, pixelsRead); cmpBytesRead = fread(&bmpRaster[row][n], sizeof(char), bytesToRead, ifP); if (cmpBytesRead < bytesToRead) { if (feof(ifP)) pm_error("End of file reading row %u " "of compressed BMP raster.", row); else pm_error("Error reading BMP raster. Errno=%d (%s)", errno, strerror(errno)); } if (rle4 && pixelsRead % 2 == 1) /* previous read ended odd */ nybbleAlign(&bmpRaster[row][n-1], cnt); pixelsRead += cnt; totalBytesRead += cmpBytesRead + 2; } break; case END_OF_ROW: { if (cols == pixelsRead || cols + pixelsPerRowMargin == pixelsRead) { if (!lastrow) { *bytesReadP += totalBytesRead + 2; return; } else if (readRLEcode(ifP, NULL, NULL) == END_OF_BMP) { *bytesReadP += totalBytesRead +4; return; } else /* lastrow and END_OF_BITMAP not detected */ pm_error(err_decode, "End of bitmap not marked", row, pixelsRead ); } else pm_error(err_decode, "Premature end of row", row, pixelsRead); } break; case END_OF_BMP: { if (lastrow && (cols == pixelsRead || cols + pixelsPerRowMargin == pixelsRead)){ *bytesReadP += totalBytesRead + 2; return; } else pm_error(err_decode, "Premature end of bitmap", row, pixelsRead ); /* Windows programs do not reject premature end of bitmap. Rather, they set the remaining pixels of the raster to an arbitrary value. In practice, images with incomplete bitmaps are rare. */ } break; case DELTA: { /* Delta means "move the point (col,row) by the amount given in the next two bytes." Like premature end of bitmap, the official specs do not specify what value the skipped pixels should be set to. Judging from Windows utilities, there is no consensus within Microsoft either. */ pm_error(err_decode, "Delta code in compressed BMP image. " "This program does not process deltas", row, pixelsRead); } break; default: pm_error("Internal error processing RLE code in row %u", row); } } } static void bmpReadraster(FILE * const ifP, unsigned int const cols, unsigned int const rows, enum rowOrder const rowOrder, unsigned int const cBitCount, BMPCompType const compression, unsigned char *** const bmpRasterP, unsigned int * const bytesReadP) { /*---------------------------------------------------------------------------- Read the raster from the BMP file on *ifP (which is positioned to the raster). The raster is 'rows' rows of 'cols' columns, 'cBitCount' bits per pixel, with rows in order 'rowOrder'. Return the raster in a newly malloced 2-dimensional array and return a pointer to that array as *bmpRasterP. Leave the input file positioned immediately after the raster and return as *bytesReadP the number of bytes we read from the file (i.e. the number of bytes in the raster portion of the file). -----------------------------------------------------------------------------*/ unsigned int const bytesPerRow = (compression == BMPCOMP_RLE4) ? cols / 2 + 2 : (compression == BMPCOMP_RLE8) ? cols + 1 : ((cols * cBitCount + 31) / 32) * 4; /* A BMP raster row is a multiple of 4 bytes, padded on the right with don't cares. */ unsigned char ** bmpRaster; assert(cols < (1<<16)); assert(bytesPerRow < (1<<16)); bmpRaster = allocBmpRaster(rows, bytesPerRow); *bytesReadP = 0; /* row order BOTTOMUP is by far the most common case - the bottom line is first in the file, the top line last. We have never actually seen TOPDOWN, except in a Microsoft spec */ switch(compression){ case BMPCOMP_RGB: case BMPCOMP_BITFIELDS: { unsigned int i; for (i = 0; i < rows; ++i) readrow(ifP, rowOrder == TOPDOWN ? i : rows - i - 1, bytesPerRow, bmpRaster, bytesReadP); } break; case BMPCOMP_RLE4: case BMPCOMP_RLE8: { unsigned int i; /* Read all rows except last */ assert(rows >= 1); for (i = 0; i < rows - 1; ++i){ readrowRLE(ifP, rowOrder == TOPDOWN ? i : rows - i - 1, cols, FALSE, compression, bmpRaster, bytesReadP); } /* Read last row */ readrowRLE(ifP, rowOrder == TOPDOWN ? i : rows - i - 1, cols, TRUE, compression, bmpRaster, bytesReadP); } break; case BMPCOMP_JPEG: pm_error("BMP file uses JPEG compression. We don't know how to " "interpret that."); break; case BMPCOMP_PNG: pm_error("BMP file uses PNG compression. We don't know how to " "interpret that."); break; } *bmpRasterP = bmpRaster; } static void reportHeader(struct bmpInfoHeader const header, unsigned int const offBits, bool const verbose) { if (verbose) { pm_message("BMP image header says:"); pm_message(" Class of BMP: %s", BMPClassName(header.class)); pm_message(" Width: %d pixels", header.cols); pm_message(" Height: %d pixels", header.rows); pm_message(" Depth: %d planes", header.cPlanes); pm_message(" Row order: %s", header.rowOrder == BOTTOMUP ? "bottom up" : "top down"); pm_message(" Byte offset of raster within file: %u", offBits); pm_message(" Bits per pixel in raster: %u", header.cBitCount); pm_message(" Compression: %s", BMPCompTypeName(header.compression)); pm_message(" Colors in color map: %u", header.cmapSize); } else { pm_message("%s BMP, %ux%ux%u", BMPClassName(header.class), header.cols, header.rows, header.cBitCount); } } static void validateCPlanes(unsigned short const cPlanes) { if (cPlanes != 1) pm_error("Error: invalid planes value in BMP header. Must be 1"); } static void analyzeColors(xel const colormap[], unsigned int const cmapSize, xelval const maxval, bool * const grayPresentP, bool * const colorPresentP) { if (cmapSize == 0) { /* No colormap, and we're not about to search the entire raster, so we just assume it's full color */ *colorPresentP = TRUE; *grayPresentP = TRUE; } else { unsigned int i; *colorPresentP = FALSE; /* initial assumption */ *grayPresentP = FALSE; /* initial assumption */ for (i = 0; i < cmapSize; ++i) { if (PPM_ISGRAY(colormap[i])) { if (PPM_GETR(colormap[i]) != 0 && PPM_GETR(colormap[i]) != maxval) *grayPresentP = TRUE; } else *colorPresentP = TRUE; } } } static void warnIfOffBitsWrong(struct bmpInfoHeader const bmpHeader, unsigned int const offBits) { if (offBits != BMPoffbits(bmpHeader.class, bmpHeader.cBitCount, bmpHeader.cmapSize)) { pm_message("warning: the BMP header says the raster starts " "at offset %u bytes into the file (offbits), " "but that there are %u bytes of information before " "the raster. This inconsistency probably means the " "input file is not a legal BMP file and is unusable.", offBits, BMPoffbits(bmpHeader.class, bmpHeader.cBitCount, bmpHeader.cmapSize)); } } static void readColorMap(FILE * const ifP, struct bmpInfoHeader const bmpHeader, xel ** const colorMapP, unsigned int * const posP) { unsigned int bytesRead; bmpReadColormap(ifP, bmpHeader.class, colorMapP, bmpHeader.cmapSize, &bytesRead); *posP += bytesRead; } static void readRaster(FILE * const ifP, struct bmpInfoHeader const bmpHeader, unsigned char *** const bmpRasterP, unsigned int * const posP) { unsigned int bytesRead; bmpReadraster(ifP, bmpHeader.cols, bmpHeader.rows, bmpHeader.rowOrder, bmpHeader.cBitCount, bmpHeader.compression, bmpRasterP, &bytesRead); *posP += bytesRead; } static bool isValidBmpBpp(unsigned int const cBitCount) { switch (cBitCount) { case 1: case 2: case 4: case 8: case 16: case 24: case 32: return true; default: return false; } } static void readBmp(FILE * const ifP, unsigned char *** const bmpRasterP, unsigned int * const colsP, unsigned int * const rowsP, bool * const grayPresentP, bool * const colorPresentP, unsigned int * const cBitCountP, struct pixelformat * const pixelformatP, xel ** const colormapP, unsigned int * const cmapSizeP, bool const verbose) { xel * colormap; /* malloc'ed */ unsigned int pos; /* Current byte position in the BMP file */ /* The following are all information from the BMP headers */ unsigned int offBits; /* Byte offset into file of raster */ struct bmpInfoHeader bmpHeader; pos = 0; /* Starting at the beginning ... */ { unsigned int bytesRead; bmpReadfileheader(ifP, &bytesRead, &offBits); pos += bytesRead; } { unsigned int bytesRead; const char * error; bmpReadinfoheader(ifP, &bytesRead, &bmpHeader, &error); if (error) pm_error("Failed to read the BMP info header. Image may " "not be a valid BMP. %s", error); if (verbose) pm_message("Read %u bytes of header", bytesRead); pos += bytesRead; } reportHeader(bmpHeader, offBits, verbose); validateCPlanes(bmpHeader.cPlanes); warnIfOffBitsWrong(bmpHeader, offBits); readColorMap(ifP, bmpHeader, &colormap, &pos); analyzeColors(colormap, bmpHeader.cmapSize, bmpMaxval, grayPresentP, colorPresentP); readOffBytes(ifP, offBits - pos); pos = offBits; readRaster(ifP, bmpHeader, bmpRasterP, &pos); if (fgetc(ifP) != EOF) pm_message("warning: some image data remains unread."); if (!isValidBmpBpp(bmpHeader.cBitCount)) pm_error("Invalid BMP image: 'cBitCount' field of header " "(number of bits for each pixel in raster) is %u", bmpHeader.cBitCount); *cBitCountP = bmpHeader.cBitCount; *colsP = bmpHeader.cols; *rowsP = bmpHeader.rows; *pixelformatP = bmpHeader.pixelformat; *colormapP = colormap; *cmapSizeP = bmpHeader.cmapSize; } static void writeRasterGen(unsigned char ** const bmpRaster, unsigned int const cols, unsigned int const rows, int const format, unsigned int const cBitCount, struct pixelformat const pixelformat, xel const colormap[], unsigned int const cmapSize) { /*---------------------------------------------------------------------------- Write the PNM raster to Standard Output, corresponding to the raw BMP raster bmpRaster. Write the raster assuming the PNM image has dimensions 'cols' by 'rows' and format 'format', with maxval 255. The BMP image has 'cBitCount' bits per pixel, arranged in format 'pixelformat'. If the image is colormapped, colormap[] is the colormap (colormap[i] is the color with color index i). writeRasterPbm() is faster for a PBM image. -----------------------------------------------------------------------------*/ xel * xelrow; unsigned int row; xelrow = pnm_allocrow(cols); for (row = 0; row < rows; ++row) { convertRow(bmpRaster[row], xelrow, cols, cBitCount, pixelformat, colormap, cmapSize); pnm_writepnmrow(stdout, xelrow, cols, bmpMaxval, format, FALSE); } pnm_freerow(xelrow); } static void writeRasterPbm(unsigned char ** const bmpRaster, unsigned int const cols, unsigned int const rows, xel const colormap[]) { /*---------------------------------------------------------------------------- Write the PBM raster to Standard Output corresponding to the raw BMP raster bmpRaster. Write the raster assuming the PBM image has dimensions 'cols' by 'rows'. The BMP image has 'cBitCount' bits per pixel, arranged in format 'pixelformat'. The image must be colormapped; colormap[] is the colormap (colormap[i] is the color with color index i). We cannot handle the abnormal case in which colormap[0] and colormap[1] have the same value (i.e. both white or both black.) We destroy *bmpRaster as a side effect. -----------------------------------------------------------------------------*/ unsigned int const colCharCt = pbm_packed_bytes(cols); unsigned int row; enum colorFormat {BlackWhite, WhiteBlack}; enum colorFormat colorformat; if (PPM_GETR(colormap[0]) > 0) colorformat = WhiteBlack; else colorformat = BlackWhite; for (row = 0; row < rows; ++row){ unsigned char * const bitrow = bmpRaster[row]; if (colorformat == BlackWhite) { unsigned int i; for (i = 0; i < colCharCt; ++i) bitrow[i] = ~bitrow[i]; /* flip all pixels */ } pbm_cleanrowend_packed(bitrow, cols); pbm_writepbmrow_packed(stdout, bitrow, cols, FALSE); } } int main(int argc, const char ** argv) { struct cmdlineInfo cmdline; FILE * ifP; int outputType; bool grayPresent, colorPresent; /* These tell whether the image contains shades of gray other than black and white and whether it has colors other than black, white, and gray. */ unsigned int cols, rows; unsigned char ** bmpRaster; /* The raster part of the BMP image, as a row x column array, with each element being a raw byte from the BMP raster. Note that bmpRaster[0] is really Row 0 -- the top row of the image, even though the bottom row comes first in the BMP format. */ unsigned int cBitCount; /* Number of bits in BMP raster for each pixel */ struct pixelformat pixelformat; /* Format of the raster bits for a single pixel */ xel * colormap; /* Malloc'ed colormap (palette) from the BMP. Contents of map undefined if not a colormapped BMP. */ unsigned int cmapSize; /* Number of colormap entries. From BMP header. Note that a file may be 8 bits per pixel but have fewer than 256 colors. In the 1 bit per pixel case, there should be 2 entries according to the official specification, but we allow files with just 1. */ pm_proginit(&argc, argv); parseCommandLine(argc, argv, &cmdline); ifP = pm_openr(cmdline.inputFileName); if (streq(cmdline.inputFileName, "-")) ifname = "Standard Input"; else ifname = cmdline.inputFileName; readBmp(ifP, &bmpRaster, &cols, &rows, &grayPresent, &colorPresent, &cBitCount, &pixelformat, &colormap, &cmapSize, cmdline.verbose); pm_close(ifP); if (colorPresent) { outputType = PPM_TYPE; pm_message("WRITING PPM IMAGE"); } else if (grayPresent) { outputType = PGM_TYPE; pm_message("WRITING PGM IMAGE"); } else { outputType = PBM_TYPE; pm_message("WRITING PBM IMAGE"); } if (outputType == PBM_TYPE && cBitCount == 1){ pbm_writepbminit(stdout, cols, rows, FALSE); writeRasterPbm(bmpRaster, cols, rows, colormap); } else { pnm_writepnminit(stdout, cols, rows, bmpMaxval, outputType, FALSE); writeRasterGen(bmpRaster, cols, rows, outputType, cBitCount, pixelformat, colormap, cmapSize); } free(colormap); free(bmpRaster); return 0; }