Newer
Older
#include "MantidAPI/FileProperty.h"
Federico Montesino Pouzols
committed
#include "MantidAPI/MultipleFileProperty.h"
#include "MantidAPI/NumericAxis.h"
#include "MantidDataHandling/LoadFITS.h"
#include "MantidDataObjects/Workspace2D.h"
Federico Montesino Pouzols
committed
#include "MantidKernel/BoundedValidator.h"
#include <boost/algorithm/string.hpp>
#include <boost/scoped_ptr.hpp>
Federico Montesino Pouzols
committed
#include <Poco/BinaryReader.h>
#include <Poco/FileStream.h>
#include <Poco/Path.h>
using namespace Mantid::API;
using namespace Mantid::Kernel;
namespace {
/**
* Reinterpret a byte sequence as InterpretType and cast to double
* @param Pointer to byte src
*/
template <typename InterpretType> double toDouble(uint8_t *src) {
return static_cast<double>(*reinterpret_cast<InterpretType *>(src));
}
}
namespace Mantid {
namespace DataHandling {
// Register the algorithm into the AlgorithmFactory
DECLARE_FILELOADER_ALGORITHM(LoadFITS)
// Static class constants
const std::string LoadFITS::g_BIT_DEPTH_NAME = "BitDepthName";
const std::string LoadFITS::g_ROTATION_NAME = "RotationName";
const std::string LoadFITS::g_AXIS_NAMES_NAME = "AxisNames";
const std::string LoadFITS::g_IMAGE_KEY_NAME = "ImageKeyName";
const std::string LoadFITS::g_HEADER_MAP_NAME = "HeaderMapFile";
const std::string LoadFITS::g_defaultImgType = "SAMPLE";
Federico Montesino Pouzols
committed
/**
* Constructor. Just initialize everything to prevent issues.
*/
Federico Montesino Pouzols
committed
LoadFITS::LoadFITS()
: m_headerScaleKey(), m_headerOffsetKey(), m_headerBitDepthKey(),
m_headerRotationKey(), m_headerImageKeyKey(), m_headerAxisNameKeys(),
Federico Montesino Pouzols
committed
m_mapFile(), m_pixelCount(0) {
setupDefaultKeywordNames();
}
/**
* Return the confidence with with this algorithm can load the file
* @param descriptor A descriptor for the file
* @returns An integer specifying the confidence level. 0 indicates it will not
* be used
*/
int LoadFITS::confidence(Kernel::FileDescriptor &descriptor) const {
// Should really improve this to check the file header (of first file at
// least) to make sure it contains the fields wanted
return (descriptor.extension() == ".fits" || descriptor.extension() == ".fit")
? 80
: 0;
}
/**
* Initialise the algorithm. Declare properties which can be set before execution
* (input) or
* read from after the execution (output).
*/
void LoadFITS::init() {
// Specify file extensions which can be associated with a FITS file.
std::vector<std::string> exts, exts2;
// Declare the Filename algorithm property. Mandatory. Sets the path to the
// file to load.
exts.clear();
exts.push_back(".fits");
exts.push_back(".fit");
exts2.push_back(".*");
declareProperty(new MultipleFileProperty("Filename", exts),
Federico Montesino Pouzols
committed
"The name of the input file (note that you can give "
"multiple file names separated by commas).");
declareProperty(new API::WorkspaceProperty<API::Workspace>(
"OutputWorkspace", "", Kernel::Direction::Output));
Federico Montesino Pouzols
committed
declareProperty(
new Kernel::PropertyWithValue<bool>("LoadAsRectImg", false,
Kernel::Direction::Input),
"If enabled (not by default), the output Workspace2D will have "
"one histogram per row and one bin per pixel, such that a 2D "
"color plot (color fill plot) will display an image.");
Federico Montesino Pouzols
committed
auto zeroOrPosDbl = boost::make_shared<BoundedValidator<double>>();
zeroOrPosDbl->setLower(0.0);
declareProperty("FilterNoiseLevel", 0.0, zeroOrPosDbl,
"Threshold to remove noisy pixels. Try 50 for example.");
Federico Montesino Pouzols
committed
auto posInt = boost::make_shared<BoundedValidator<int>>();
posInt->setLower(1);
declareProperty("BinSize", 1, posInt,
"Rebunch n*n on both axes, generating pixels with sums of "
Federico Montesino Pouzols
committed
"blocks of n by n original pixels.");
Federico Montesino Pouzols
committed
auto posDbl = boost::make_shared<BoundedValidator<double>>();
posDbl->setLower(std::numeric_limits<double>::epsilon());
declareProperty("Scale", 80.0, posDbl, "Pixels per cm.",
Kernel::Direction::Input);
new FileProperty(g_HEADER_MAP_NAME, "", FileProperty::OptionalDirectory,
Federico Montesino Pouzols
committed
"", Kernel::Direction::Input),
"A file mapping header key names to non-standard names [line separated "
"values in the format KEY=VALUE, e.g. BitDepthName=BITPIX] - do not use "
"this if you want to keep compatibility with standard FITS files.");
* Execute the algorithm.
*/
// for non-standard headers, by default won't do anything
Federico Montesino Pouzols
committed
std::string fName = getPropertyValue("Filename");
std::vector<std::string> paths;
boost::split(paths, fName, boost::is_any_of(","));
Federico Montesino Pouzols
committed
int binSize = getProperty("BinSize");
double noiseThresh = getProperty("FilterNoiseLevel");
Federico Montesino Pouzols
committed
bool loadAsRectImg = getProperty("LoadAsRectImg");
Federico Montesino Pouzols
committed
const std::string outWSName = getPropertyValue("OutputWorkspace");
doLoadFiles(paths, outWSName, loadAsRectImg, binSize, noiseThresh);
}
/**
* Load header(s) from FITS file(s) into FITSInfo header
* struct(s). This is usually the first step when loading FITS files
* into workspaces or anything else. In the simplest case, paths has
* only one string and only one header struct is added in headers.
*
* @param paths File name(s)
* @param headers Vector where to store the header struct(s)
*
* @throws std::runtime_error if issues are found in the headers
*/
void LoadFITS::doLoadHeaders(const std::vector<std::string> &paths,
std::vector<FITSInfo> &headers) {
headers.resize(paths.size());
for (size_t i = 0; i < paths.size(); ++i) {
headers[i].extension = "";
headers[i].filePath = paths[i];
Federico Montesino Pouzols
committed
Federico Montesino Pouzols
committed
// Get various pieces of information from the file header which are used
// to
try {
parseHeader(headers[i]);
} catch (std::exception &e) {
Federico Montesino Pouzols
committed
// Unable to parse the header, throw.
throw std::runtime_error(
"Severe problem found while parsing the header of "
"this FITS file (" +
paths[i] +
"). This file may not be standard FITS. Error description: " +
e.what());
Federico Montesino Pouzols
committed
}
// Get and convert specific standard header values which will are
// needed to know how to load the data: BITPIX, NAXIS, NAXISi (where i =
// 1..NAXIS, e.g. NAXIS2 for two axis).
Federico Montesino Pouzols
committed
try {
Federico Montesino Pouzols
committed
std::string tmpBitPix = headers[i].headerKeys[m_headerBitDepthKey];
Federico Montesino Pouzols
committed
if (boost::contains(tmpBitPix, "-")) {
boost::erase_all(tmpBitPix, "-");
headers[i].isFloat = true;
Federico Montesino Pouzols
committed
} else {
headers[i].isFloat = false;
Federico Montesino Pouzols
committed
}
Federico Montesino Pouzols
committed
try {
headers[i].bitsPerPixel = boost::lexical_cast<int>(tmpBitPix);
Federico Montesino Pouzols
committed
} catch (std::exception &e) {
throw std::runtime_error(
"Coult not interpret the entry number of bits per pixel (" +
m_headerBitDepthKey + ") as an integer. Error: " + e.what());
}
// Check that the files use bit depths of either 8, 16 or 32
if (headers[i].bitsPerPixel != 8 && headers[i].bitsPerPixel != 16 &&
headers[i].bitsPerPixel != 32 && headers[i].bitsPerPixel != 64)
throw std::runtime_error(
"This algorithm only supports 8, 16, 32 or 64 "
"bits per pixel. The header of file '" +
paths[i] + "' says that its bit depth is: " +
boost::lexical_cast<std::string>(headers[i].bitsPerPixel));
} catch (std::exception &e) {
throw std::runtime_error(
"Failed to process the '" + m_headerBitDepthKey +
"' entry (bits per pixel) in the header of this file: " + paths[i] +
". Error description: " + e.what());
}
try {
Federico Montesino Pouzols
committed
// Add the image key, use the value in the FITS header if found,
// otherwise default (to SAMPLE).
auto it = headers[i].headerKeys.find(m_headerImageKeyKey);
if (headers[i].headerKeys.end() != it) {
headers[i].imageKey = it->second;
Federico Montesino Pouzols
committed
} else {
headers[i].imageKey = g_defaultImgType;
Federico Montesino Pouzols
committed
}
} catch (std::exception &e) {
throw std::runtime_error("Failed to process the '" + m_headerImageKeyKey +
"' entry (type of image: sample, dark, open) in "
"the header of this file: " +
paths[i] + ". Error description: " + e.what());
}
try {
headers[i].numberOfAxis = static_cast<int>(m_headerAxisNameKeys.size());
for (int j = 0; headers.size() > i && j < headers[i].numberOfAxis; ++j) {
headers[i].axisPixelLengths.push_back(boost::lexical_cast<size_t>(
headers[i].headerKeys[m_headerAxisNameKeys[j]]));
// only debug level, when loading multiple files this is very verbose
g_log.debug() << "Found axis length header entry: "
<< m_headerAxisNameKeys[j] << " = "
<< headers[i].axisPixelLengths.back() << std::endl;
// Various extensions to the FITS format are used elsewhere, and
// must be parsed differently if used. This loader Loader
// doesn't support this.
headers[i].extension = headers[i].headerKeys["XTENSION"];
} catch (std::exception &e) {
throw std::runtime_error(
"Failed to process the '" + m_headerNAxisNameKey +
"' entries (dimensions) in the header of this file: " + paths[i] +
". Error description: " + e.what());
Federico Montesino Pouzols
committed
Federico Montesino Pouzols
committed
// scale parameter, header BSCALE in the fits standard
if ("" == headers[i].headerKeys[m_headerScaleKey]) {
headers[i].scale = 1;
} else {
try {
headers[i].scale = boost::lexical_cast<double>(
headers[i].headerKeys[m_headerScaleKey]);
Federico Montesino Pouzols
committed
} catch (std::exception &e) {
throw std::runtime_error(
"Coult not interpret the entry number of bits per pixel (" +
m_headerBitDepthKey + " = " +
headers[i].headerKeys[m_headerScaleKey] +
Federico Montesino Pouzols
committed
") as a floating point number (double). Error: " + e.what());
}
}
// data offsset parameter, header BZERO in the fits standard
if ("" == headers[i].headerKeys[m_headerOffsetKey]) {
headers[i].offset = 0;
} else {
try {
headers[i].offset =
boost::lexical_cast<int>(headers[i].headerKeys[m_headerOffsetKey]);
Federico Montesino Pouzols
committed
} catch (std::exception & /*e*/) {
Federico Montesino Pouzols
committed
// still, second try with floating point format (as used for example
// by
Federico Montesino Pouzols
committed
// Starlight XPRESS cameras)
try {
double doff = boost::lexical_cast<double>(
headers[i].headerKeys[m_headerOffsetKey]);
Federico Montesino Pouzols
committed
double intPart;
if (0 != modf(doff, &intPart)) {
// anyway we'll do a cast, but warn if there was a fraction
g_log.warning()
<< "The value given in the FITS header entry for the data "
"offset (" +
m_headerOffsetKey + " = " +
headers[i].headerKeys[m_headerOffsetKey] +
Federico Montesino Pouzols
committed
") has a fractional part, and it will be ignored!"
<< std::endl;
}
headers[i].offset = static_cast<int>(doff);
} catch (std::exception &e) {
throw std::runtime_error(
"Coult not interpret the entry number of data offset (" +
m_headerOffsetKey + " = " +
headers[i].headerKeys[m_headerOffsetKey] +
") as an integer number nor a floating point "
"number (double). Error: " +
Federico Montesino Pouzols
committed
e.what());
}
}
}
// Check each header is valid/supported: standard (no extension to
// FITS), and has two axis
headerSanityCheck(headers[i], headers[0]);
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
/**
* Checks that a FITS header (once loaded) is valid/supported:
* standard (no extension to FITS), and has two axis with the expected
* dimensions.
*
* @param hdr FITS header struct loaded from a file - to check
*
* @param hdrFirst FITS header struct loaded from a (first) reference file -
*to
* compare against
*
* @throws std::exception if there's any issue or unsupported entry in the
* header
*/
void LoadFITS::headerSanityCheck(const FITSInfo &hdr,
const FITSInfo &hdrFirst) {
bool valid = true;
if (hdr.extension != "") {
valid = false;
g_log.error() << "File " << hdr.filePath
<< ": extensions found in the header." << std::endl;
}
if (hdr.numberOfAxis != 2) {
valid = false;
g_log.error() << "File " << hdr.filePath
<< ": the number of axes is not 2 but: " << hdr.numberOfAxis
<< std::endl;
}
// Test current item has same axis values as first item.
if (hdr.axisPixelLengths[0] != hdrFirst.axisPixelLengths[0]) {
valid = false;
g_log.error() << "File " << hdr.filePath
<< ": the number of pixels in the first dimension differs "
"from the first file loaded (" << hdrFirst.filePath
<< "): " << hdr.axisPixelLengths[0]
<< " != " << hdrFirst.axisPixelLengths[0] << std::endl;
}
if (hdr.axisPixelLengths[1] != hdrFirst.axisPixelLengths[1]) {
valid = false;
g_log.error() << "File " << hdr.filePath
<< ": the number of pixels in the second dimension differs"
"from the first file loaded (" << hdrFirst.filePath
<< "): " << hdr.axisPixelLengths[0]
<< " != " << hdrFirst.axisPixelLengths[0] << std::endl;
}
// Check the format is correct and create the Workspace
if (!valid) {
// Invalid files, record error
throw std::runtime_error(
"An issue has been found in the header of this FITS file: " +
hdr.filePath +
". This algorithm currently doesn't support FITS files with "
"non-standard extensions, more than two axis "
"of data, or has detected that all the files are "
"not similar.");
}
}
/**
* Create FITS file information for each file selected. Loads headers
* and data from the files and creates and fills the output
* workspace(s).
*
* @param paths File names as given in the algorithm input property
*
* @param outWSName name of the output (group) workspace to create
*
* @param loadAsRectImg Load files with 1 spectrum per row and 1 bin
* per column, so a color fill plot displays the image
*
* @param binSize size to rebin (1 == no re-bin == default)
*
* @param noiseThresh threshold for noise filtering
*
* @throw std::runtime_error when load fails (for example a memory
* allocation issue, wrong rebin requested, etc.)
*/
void LoadFITS::doLoadFiles(const std::vector<std::string> &paths,
const std::string &outWSName, bool loadAsRectImg,
int binSize, double noiseThresh) {
std::vector<FITSInfo> headers;
doLoadHeaders(paths, headers);
// No extension is set -> it's the standard format which we can parse.
if (headers[0].numberOfAxis > 0)
m_pixelCount += headers[0].axisPixelLengths[0];
// Presumably 2 axis, but futureproofing.
for (int i = 1; i < headers[0].numberOfAxis; ++i) {
m_pixelCount *= headers[0].axisPixelLengths[i];
}
// Check consistency of binSize asap
for (int i = 0; i < headers[0].numberOfAxis; ++i) {
if (0 != (headers[0].axisPixelLengths[i] % binSize)) {
throw std::runtime_error(
"Cannot rebin this image in blocks of " +
boost::lexical_cast<std::string>(binSize) + " x " +
boost::lexical_cast<std::string>(binSize) +
" pixels as requested because the size of dimension " +
boost::lexical_cast<std::string>(i + 1) + " (" +
boost::lexical_cast<std::string>(headers[0].axisPixelLengths[i]) +
") is not a multiple of the bin size.");
}
}
MantidImage imageY(headers[0].axisPixelLengths[1],
std::vector<double>(headers[0].axisPixelLengths[0]));
MantidImage imageE(headers[0].axisPixelLengths[1],
std::vector<double>(headers[0].axisPixelLengths[0]));
size_t bytes = (headers[0].bitsPerPixel / 8) * m_pixelCount;
std::vector<char> buffer;
try {
buffer.resize(bytes);
} catch (std::exception &) {
throw std::runtime_error(
"Could not allocate enough memory to run when trying to allocate " +
boost::lexical_cast<std::string>(bytes) + " bytes.");
}
// Create a group for these new workspaces, if the group already exists, add
// to it.
std::string groupName = outWSName;
size_t fileNumberInGroup = 0;
WorkspaceGroup_sptr wsGroup;
if (!AnalysisDataService::Instance().doesExist(groupName)) {
wsGroup = WorkspaceGroup_sptr(new WorkspaceGroup());
wsGroup->setTitle(groupName);
} else {
// Get the name of the latest file in group to start numbering from
if (AnalysisDataService::Instance().doesExist(groupName))
wsGroup =
AnalysisDataService::Instance().retrieveWS<WorkspaceGroup>(groupName);
std::string latestName = wsGroup->getNames().back();
// Set next file number
fileNumberInGroup = fetchNumber(latestName) + 1;
}
size_t totalWS = headers.size();
// Create a progress reporting object
API::Progress progress(this, 0, 1, totalWS + 1);
progress.report(0, "Loading file(s) into workspace(s)");
// Create first workspace (with instrument definition). This is also used as
// a template for creating others
Federico Montesino Pouzols
committed
Workspace2D_sptr imgWS;
imgWS = makeWorkspace(headers[0], fileNumberInGroup, buffer, imageY, imageE,
imgWS, loadAsRectImg, binSize, noiseThresh);
progress.report(1, "First file loaded.");
Federico Montesino Pouzols
committed
wsGroup->addWorkspace(imgWS);
if (isInstrOtherThanIMAT(headers[0])) {
// For now we assume IMAT except when specific headers are found by
// isInstrOtherThanIMAT()
//
// TODO: do this conditional on INSTR='IMAT' when we have proper IMAT .fits
// files
try {
IAlgorithm_sptr loadInst = createChildAlgorithm("LoadInstrument");
std::string directoryName =
Kernel::ConfigService::Instance().getInstrumentDirectory();
directoryName = directoryName + "/IMAT_Definition.xml";
loadInst->setPropertyValue("Filename", directoryName);
loadInst->setProperty<MatrixWorkspace_sptr>(
Federico Montesino Pouzols
committed
"Workspace", boost::dynamic_pointer_cast<MatrixWorkspace>(imgWS));
loadInst->execute();
} catch (std::exception &ex) {
g_log.information("Cannot load the instrument definition. " +
std::string(ex.what()));
}
}
// don't feel tempted to parallelize this loop as it is - it uses the same
// imageY and imageE buffers for all the workspaces
for (int64_t i = 1; i < static_cast<int64_t>(totalWS); ++i) {
Federico Montesino Pouzols
committed
imgWS = makeWorkspace(headers[i], fileNumberInGroup, buffer, imageY, imageE,
imgWS, loadAsRectImg, binSize, noiseThresh);
progress.report("Loaded file " + boost::lexical_cast<std::string>(i + 1) +
" of " + boost::lexical_cast<std::string>(totalWS));
Federico Montesino Pouzols
committed
wsGroup->addWorkspace(imgWS);
}
setProperty("OutputWorkspace", wsGroup);
}
Federico Montesino Pouzols
committed
/**
* Read a single files header and populate an object with the information.
Federico Montesino Pouzols
committed
*
* @param headerInfo A FITSInfo file object to parse header
* information into. This object must have its field filePath set to
* the input file
Federico Montesino Pouzols
committed
*
* A typical simple FITS header looks like this:
@verbatim
SIMPLE = T / file does conform to FITS standard
BITPIX = 16 / number of bits per data pixel
NAXIS = 2 / number of data axes
NAXIS1 = 512 / length of data axis 1
NAXIS2 = 512 / length of data axis 2
EXTEND = T / FITS dataset may contain extensions
COMMENT FITS (Flexible Image Transport System) format is defined in 'Astronomy
COMMENT and Astrophysics', volume 376, page 359; bibcode: 2001A&A...376..359H
TOF = 0.0595897599999995 / Ttime of flight from the external trigger
TIMEBIN = 4.096E-005 / Time width of this image
N_COUNTS= 182976 / Total counts in this image
N_TRIGS = 4426 / Number of triggers acquired
END
@endverbatim
*
* @throws various std::runtime_error etc. on read failure
*/
void LoadFITS::parseHeader(FITSInfo &headerInfo) {
headerInfo.headerSizeMultiplier = 0;
std::ifstream istr(headerInfo.filePath.c_str(), std::ios::binary);
Federico Montesino Pouzols
committed
istr.seekg(0, istr.end);
if (!(istr.tellg() > 0)) {
Federico Montesino Pouzols
committed
throw std::runtime_error(
"Found a file that is readable but empty (0 bytes size): " +
Federico Montesino Pouzols
committed
headerInfo.filePath);
}
istr.seekg(0, istr.beg);
Poco::BinaryReader reader(istr);
// Iterate 80 bytes at a time until header is parsed | 2880 bytes is the
// fixed header length of FITS
// 2880/80 = 36 iterations required
Federico Montesino Pouzols
committed
const std::string commentKW = "COMMENT";
bool endFound = false;
while (!endFound) {
headerInfo.headerSizeMultiplier++;
Federico Montesino Pouzols
committed
const int entriesPerHDU = 36;
for (int i = 0; i < entriesPerHDU; ++i) {
// Keep vect of each header item, including comments, and also keep a
// map of individual keys.
std::string part;
reader.readRaw(80, part);
headerInfo.headerItems.push_back(part);
Federico Montesino Pouzols
committed
// from the FITS standard about COMMENT: This keyword shall have no
// associated value; columns 9-80 may contain any ASCII text.
// That includes '='
if (boost::iequals(commentKW, part.substr(0, commentKW.size()))) {
continue;
}
// Add non-comment key/values. These hey and value are separated by the
// character '='. All keys should be unique.
// This will simply and silenty ignore any entry without the '='
auto eqPos = part.find('=');
if (eqPos > 0) {
std::string key = part.substr(0, eqPos);
std::string value = part.substr(eqPos + 1);
Federico Montesino Pouzols
committed
// Comments on header entries are added after the value separated by a /
// symbol. Exclude those comments.
auto slashPos = value.find('/');
if (slashPos > 0)
value = value.substr(0, slashPos);
boost::trim(key);
boost::trim(value);
if (key == "END")
endFound = true;
if (key != "")
headerInfo.headerKeys[key] = value;
}
}
}
istr.close();
Federico Montesino Pouzols
committed
}
* Creates and initialises a workspace with instrument definition and fills it
* with data
*
* @param fileInfo information for the current file
Federico Montesino Pouzols
committed
*
* @param newFileNumber sequence number for the new file when added
* into ws group
*
* @param buffer pre-allocated buffer to contain data values
* @param imageY Object to set the Y data values in
* @param imageE Object to set the E data values in
Federico Montesino Pouzols
committed
*
* @param parent A workspace which can be used to copy initialisation
* information from (size/instrument def etc)
Federico Montesino Pouzols
committed
* @param loadAsRectImg if true, the new workspace will have one
* spectrum per row and one bin per column, instead of the (default)
* as many spectra as pixels.
*
* @param binSize size to rebin (1 == no re-bin == default)
*
* @param noiseThresh threshold for noise filtering
*
* @returns A newly created Workspace2D, as a shared pointer
Workspace2D_sptr
LoadFITS::makeWorkspace(const FITSInfo &fileInfo, size_t &newFileNumber,
std::vector<char> &buffer, MantidImage &imageY,
Federico Montesino Pouzols
committed
MantidImage &imageE, const Workspace2D_sptr parent,
bool loadAsRectImg, int binSize, double noiseThresh) {
Federico Montesino Pouzols
committed
// Create workspace (taking into account already here if rebinning is
// going to happen)
if (!parent) {
Federico Montesino Pouzols
committed
if (!loadAsRectImg) {
size_t finalPixelCount = m_pixelCount / binSize * binSize;
ws = boost::dynamic_pointer_cast<Workspace2D>(
WorkspaceFactory::Instance().create("Workspace2D", finalPixelCount, 2,
1));
Federico Montesino Pouzols
committed
} else {
ws = boost::dynamic_pointer_cast<Workspace2D>(
WorkspaceFactory::Instance().create(
Federico Montesino Pouzols
committed
"Workspace2D",
fileInfo.axisPixelLengths[1] / binSize, // one bin per column
fileInfo.axisPixelLengths[0] / binSize +
Federico Montesino Pouzols
committed
1, // one spectrum per row
fileInfo.axisPixelLengths[0] / binSize));
Federico Montesino Pouzols
committed
}
} else {
ws = boost::dynamic_pointer_cast<Workspace2D>(
WorkspaceFactory::Instance().create(parent));
Federico Montesino Pouzols
committed
// this pixel scale property is used to set the workspace X values
double cm_1 = getProperty("Scale");
Federico Montesino Pouzols
committed
// amount of width units (e.g. cm) per pixel
Federico Montesino Pouzols
committed
double cmpp = 1; // cm per pixel == bin width
if (0.0 != cm_1)
cmpp /= cm_1;
cmpp *= static_cast<double>(binSize);
Federico Montesino Pouzols
committed
if (loadAsRectImg && 1 == binSize) {
Federico Montesino Pouzols
committed
// set data directly into workspace
readDataToWorkspace(fileInfo, cmpp, ws, buffer);
} else {
readDataToImgs(fileInfo, imageY, imageE, buffer);
doFilterNoise(noiseThresh, imageY, imageE);
Federico Montesino Pouzols
committed
Federico Montesino Pouzols
committed
// Note this can change the sizes of the images and the number of pixels
if (1 == binSize) {
Federico Montesino Pouzols
committed
ws->setImageYAndE(imageY, imageE, 0, loadAsRectImg, cmpp,
false /* no parallel load */);
Federico Montesino Pouzols
committed
Federico Montesino Pouzols
committed
} else {
MantidImage rebinnedY(imageY.size() / binSize,
std::vector<double>(imageY[0].size() / binSize));
MantidImage rebinnedE(imageE.size() / binSize,
std::vector<double>(imageE[0].size() / binSize));
Federico Montesino Pouzols
committed
doRebin(binSize, imageY, imageE, rebinnedY, rebinnedE);
Federico Montesino Pouzols
committed
ws->setImageYAndE(rebinnedY, rebinnedE, 0, loadAsRectImg, cmpp,
false /* no parallel load */);
}
Federico Montesino Pouzols
committed
}
Federico Montesino Pouzols
committed
try {
ws->setTitle(Poco::Path(fileInfo.filePath).getFileName());
} catch (std::runtime_error &) {
ws->setTitle(padZeros(newFileNumber, g_DIGIT_SIZE_APPEND));
}
++newFileNumber;
addAxesInfoAndLogs(ws, loadAsRectImg, fileInfo, binSize, cmpp);
return ws;
}
Federico Montesino Pouzols
committed
* Add information to the workspace being loaded: labels, units, logs related to
* the image size, etc.
*
* @param ws workspace to manipulate
* @param loadAsRectImg if true, the workspace has one spectrum per
* row and one bin per column
*
* @param fileInfo information for the current file
*
* @param binSize size to rebin (1 == no re-bin == default)
*
* @param cmpp centimeters per pixel (already taking into account
* possible rebinning)
*/
void LoadFITS::addAxesInfoAndLogs(Workspace2D_sptr ws, bool loadAsRectImg,
const FITSInfo &fileInfo, int binSize,
double cmpp) {
Federico Montesino Pouzols
committed
// add axes
size_t width = fileInfo.axisPixelLengths[0] / binSize;
size_t height = fileInfo.axisPixelLengths[1] / binSize;
Federico Montesino Pouzols
committed
if (loadAsRectImg) {
// width/X axis
auto axw = new Mantid::API::NumericAxis(width + 1);
axw->title() = "width";
for (size_t i = 0; i < width + 1; i++) {
axw->setValue(i, static_cast<double>(i) * cmpp);
}
ws->replaceAxis(0, axw);
// "cm" width label unit
boost::shared_ptr<Kernel::Units::Label> unitLbl =
boost::dynamic_pointer_cast<Kernel::Units::Label>(
UnitFactory::Instance().create("Label"));
unitLbl->setLabel("width", "cm");
ws->getAxis(0)->unit() = unitLbl;
// height/Y axis
auto axh = new Mantid::API::NumericAxis(height);
axh->title() = "height";
for (size_t i = 0; i < height; i++) {
axh->setValue(i, static_cast<double>(i) * cmpp);
}
ws->replaceAxis(1, axh);
// "cm" height label unit
unitLbl = boost::dynamic_pointer_cast<Kernel::Units::Label>(
Federico Montesino Pouzols
committed
UnitFactory::Instance().create("Label"));
Federico Montesino Pouzols
committed
unitLbl->setLabel("height", "cm");
ws->getAxis(1)->unit() = unitLbl;
ws->isDistribution(true);
} else {
// TODO: what to do when loading 1pixel - 1 spectrum?
Federico Montesino Pouzols
committed
}
ws->setYUnitLabel("brightness");
Federico Montesino Pouzols
committed
// Add all header info to log.
for (auto it = fileInfo.headerKeys.begin(); it != fileInfo.headerKeys.end();
++it) {
ws->mutableRun().removeLogData(it->first, true);
new PropertyWithValue<std::string>(it->first, it->second));
}
// Add rotational data to log. Clear first from copied WS
auto it = fileInfo.headerKeys.find(m_sampleRotation);
ws->mutableRun().removeLogData("Rotation", true);
if (fileInfo.headerKeys.end() != it) {
double rot = boost::lexical_cast<double>(it->second);
if (rot >= 0) {
ws->mutableRun().addLogData(
new PropertyWithValue<double>("Rotation", rot));
}
}
// Add axis information to log. Clear first from copied WS
ws->mutableRun().removeLogData("Axis1", true);
ws->mutableRun().addLogData(new PropertyWithValue<int>(
"Axis1", static_cast<int>(fileInfo.axisPixelLengths[0])));
ws->mutableRun().removeLogData("Axis2", true);
ws->mutableRun().addLogData(new PropertyWithValue<int>(
"Axis2", static_cast<int>(fileInfo.axisPixelLengths[1])));
// Add image key data to log. Clear first from copied WS
ws->mutableRun().removeLogData("ImageKey", true);
Federico Montesino Pouzols
committed
ws->mutableRun().addLogData(
new PropertyWithValue<std::string>("ImageKey", fileInfo.imageKey));
Federico Montesino Pouzols
committed
* Reads the data (FITS matrix) from a single FITS file into a
* workspace (directly into the spectra, using one spectrum per image
* row).
Federico Montesino Pouzols
committed
* @param fileInfo information on the FITS file to load, including its path
Federico Montesino Pouzols
committed
* @param cmpp centimeters per pixel, to scale/normalize values
Federico Montesino Pouzols
committed
* @param ws workspace with the required dimensions
* @param buffer pre-allocated buffer to read from file
*
* @throws std::runtime_error if there are file input issues
Federico Montesino Pouzols
committed
void LoadFITS::readDataToWorkspace(const FITSInfo &fileInfo, double cmpp,
Workspace2D_sptr ws,
std::vector<char> &buffer) {
const size_t bytespp = (fileInfo.bitsPerPixel / 8);
const size_t len = m_pixelCount * bytespp;
Federico Montesino Pouzols
committed
readInBuffer(fileInfo, buffer, len);
const size_t nrows(fileInfo.axisPixelLengths[1]),
uint8_t *buffer8 = reinterpret_cast<uint8_t *>(&buffer.front());
Federico Montesino Pouzols
committed
PARALLEL_FOR_NO_WSP_CHECK()
for (int i = 0; i < static_cast<int>(nrows); ++i) {
Federico Montesino Pouzols
committed
Mantid::API::ISpectrum *specRow = ws->getSpectrum(i);
auto &dataX = specRow->dataX();
auto &dataY = specRow->dataY();
auto &dataE = specRow->dataE();
std::fill(dataX.begin(), dataX.end(), static_cast<double>(i) * cmpp);
for (size_t j = 0; j < ncols; ++j) {
// Map from 2D->1D index
const size_t start = ((i * (bytespp)) * nrows) + (j * (bytespp));
uint8_t const *const buffer8Start = buffer8 + start;
// Reverse byte order of current value. Make sure we allocate enough
// enough space to hold the size
boost::scoped_ptr<uint8_t> byteValue(new uint8_t[bytespp]);
std::reverse_copy(buffer8Start, buffer8Start + bytespp, byteValue.get());
Federico Montesino Pouzols
committed
double val = 0;
if (fileInfo.bitsPerPixel == 8) {
val = toDouble<uint8_t>(byteValue.get());
} else if (fileInfo.bitsPerPixel == 16) {
val = toDouble<uint16_t>(byteValue.get());
} else if (fileInfo.bitsPerPixel == 32 && !fileInfo.isFloat) {
val = toDouble<uint32_t>(byteValue.get());
} else if (fileInfo.bitsPerPixel == 64 && !fileInfo.isFloat) {
val = toDouble<uint32_t>(byteValue.get());
} else if (fileInfo.bitsPerPixel == 32 && fileInfo.isFloat) {
val = toDouble<float>(byteValue.get());
Federico Montesino Pouzols
committed
} else if (fileInfo.bitsPerPixel == 64 && fileInfo.isFloat) {
val = toDouble<double>(byteValue.get());
val = fileInfo.scale * val - fileInfo.offset;
Federico Montesino Pouzols
committed
}
Federico Montesino Pouzols
committed
/**
* Reads the data (FITS matrix) from a single FITS file into image
* objects (Y and E). E is filled with the sqrt() of Y.
*
* @param fileInfo information on the FITS file to load, including its path
* @param imageY Object to set the Y data values in
* @param imageE Object to set the E data values in
* @param buffer pre-allocated buffer to contain data values
*
* @throws std::runtime_error if there are file input issues
*/
void LoadFITS::readDataToImgs(const FITSInfo &fileInfo, MantidImage &imageY,
MantidImage &imageE, std::vector<char> &buffer) {
size_t bytespp = (fileInfo.bitsPerPixel / 8);
size_t len = m_pixelCount * bytespp;
readInBuffer(fileInfo, buffer, len);
// create pointer of correct data type to void pointer of the buffer:
uint8_t *buffer8 = reinterpret_cast<uint8_t *>(&buffer[0]);
std::vector<char> buf(bytespp);
char *tmp = &buf.front();
size_t start = 0;
for (size_t i = 0; i < fileInfo.axisPixelLengths[1]; ++i) { // width
Federico Montesino Pouzols
committed
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
for (size_t j = 0; j < fileInfo.axisPixelLengths[0]; ++j) { // height
// If you wanted to PARALLEL_...ize these loops (which doesn't
// seem to provide any speed up when loading images one at a
// time, you cannot use the start+=bytespp at the end of this
// loop. You'd need something like this:
//
// size_t start =
// ((i * (bytespp)) * fileInfo.axisPixelLengths[1]) +
// (j * (bytespp));
// Reverse byte order of current value
std::reverse_copy(buffer8 + start, buffer8 + start + bytespp, tmp);
double val = 0;
if (fileInfo.bitsPerPixel == 8)
val = static_cast<double>(*reinterpret_cast<uint8_t *>(tmp));
if (fileInfo.bitsPerPixel == 16)
val = static_cast<double>(*reinterpret_cast<uint16_t *>(tmp));
if (fileInfo.bitsPerPixel == 32 && !fileInfo.isFloat)
val = static_cast<double>(*reinterpret_cast<uint32_t *>(tmp));
if (fileInfo.bitsPerPixel == 64 && !fileInfo.isFloat)
val = static_cast<double>(*reinterpret_cast<uint64_t *>(tmp));
// cppcheck doesn't realise that these are safe casts
if (fileInfo.bitsPerPixel == 32 && fileInfo.isFloat) {
// cppcheck-suppress invalidPointerCast
val = static_cast<double>(*reinterpret_cast<float *>(tmp));
}
if (fileInfo.bitsPerPixel == 64 && fileInfo.isFloat) {
// cppcheck-suppress invalidPointerCast
val = *reinterpret_cast<double *>(tmp);
}
val = fileInfo.scale * val - fileInfo.offset;
imageY[i][j] = val;
imageE[i][j] = sqrt(val);
start += bytespp;
}
}
}
/**
* Reads the data (FITS matrix) from a single FITS file into a
* buffer. This simply reads the raw block of data, without doing any
* re-scaling or adjustment.
*
* @param fileInfo information on the FITS file to load, including its path
* @param buffer pre-allocated buffer where to read data
* @param len amount of chars/bytes/octets to read
*
* @throws std::runtime_error if there are file input issues
*/
void LoadFITS::readInBuffer(const FITSInfo &fileInfo, std::vector<char> &buffer,
size_t len) {
std::string filename = fileInfo.filePath;
Poco::FileStream file(filename, std::ios::in);
file.seekg(g_BASE_HEADER_SIZE * fileInfo.headerSizeMultiplier);
file.read(&buffer[0], len);
if (!file) {
throw std::runtime_error(
"Error while reading file: " + filename + ". Tried to read " +
boost::lexical_cast<std::string>(len) + " bytes but got " +
boost::lexical_cast<std::string>(file.gcount()) +
" bytes. The file and/or its headers may be wrong.");
}
// all is loaded
file.close();
}
Federico Montesino Pouzols
committed
/**
* Apply a simple noise filter by averaging threshold-filtered
Federico Montesino Pouzols
committed
* neighbor pixels (with 4-neighbohood / 4-connectivity). The
* filtering is done in place for both imageY and imageE.
Federico Montesino Pouzols
committed
*
* @param thresh Threshold to apply on pixels
* @param imageY raw data (Y values)
* @param imageE raw data (E/error values)
Federico Montesino Pouzols
committed
*/
Federico Montesino Pouzols
committed
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
void LoadFITS::doFilterNoise(double thresh, MantidImage &imageY,
MantidImage &imageE) {
if (thresh <= 0.0)
return;
MantidImage goodY = imageY;
MantidImage goodE = imageE;
// TODO: this is not very smart about the edge pixels (leftmost and
// rightmost columns, topmost and bottom rows)
for (size_t j = 1; j < (imageY.size() - 1); ++j) {
for (size_t i = 1; i < (imageY[0].size() - 1); ++i) {
if (((imageY[j][i] - imageY[j][i - 1]) > thresh) &&
((imageY[j][i] - imageY[j][i + 1]) > thresh) &&
((imageY[j][i] - imageY[j - 1][i]) > thresh) &&
((imageY[j][i] - imageY[j + 1][i]) > thresh))
goodY[j][i] = 0;
else
goodY[j][i] = 1;
if (((imageE[j][i] - imageE[j][i - 1]) > thresh) &&
((imageE[j][i] - imageE[j][i + 1]) > thresh) &&
((imageE[j][i] - imageE[j - 1][i]) > thresh) &&
((imageE[j][i] - imageE[j + 1][i]) > thresh))
goodE[j][i] = 0;
else
goodE[j][i] = 1;
}
}
for (size_t j = 1; j < (imageY.size() - 1); ++j) {
for (size_t i = 1; i < (imageY[0].size() - 1); ++i) {
if (!goodY[j][i]) {
if (goodY[j - 1][i] || goodY[j + 1][i] || goodY[j][i - 1] ||
goodY[j][i + 1]) {
imageY[j][i] = goodY[j - 1][i] * imageY[j - 1][i] +
goodY[j + 1][i] * imageY[j + 1][i] +
goodY[j][i - 1] * imageY[j][i - 1] +
goodY[j][i + 1] * imageY[j][i + 1];
}
}
if (!goodE[j][i]) {
if (goodE[j - 1][i] || goodE[j + 1][i] || goodE[j][i - 1] ||
goodE[j][i + 1]) {
imageE[j][i] = goodE[j - 1][i] * imageE[j - 1][i] +
goodE[j + 1][i] * imageE[j + 1][i] +
goodE[j][i - 1] * imageE[j][i - 1] +
goodE[j][i + 1] * imageE[j][i + 1];
}
}
}
Federico Montesino Pouzols
committed
}
}
/**
Federico Montesino Pouzols
committed
* Group pixels in blocks of rebin X rebin.