src/gdcmParser.cxx

   1 // gdcmHeader.cxx
   2 //-----------------------------------------------------------------------------
   3 #include "gdcmParser.h"
   4 #include "gdcmUtil.h"
   5 #include <errno.h>
   6
   7 // For nthos:
   8 #ifdef _MSC_VER
   9    #include <winsock.h>
  10 #else
  11    #include <netinet/in.h>
  12 #endif
  13
  14 #ifdef GDCM_NO_ANSI_STRING_STREAM
  15 #  include <strstream>
  16 #  define  ostringstream ostrstream
  17 # else
  18 #  include <sstream>
  19 #endif
  20 #  include <iomanip>
  21
  22 #define UI1_2_840_10008_1_2      "1.2.840.10008.1.2"
  23 #define UI1_2_840_10008_1_2_1    "1.2.840.10008.1.2.1"
  24 #define UI1_2_840_10008_1_2_2    "1.2.840.10008.1.2.2"
  25 #define UI1_2_840_10008_1_2_1_99 "1.2.840.10008.1.2.1.99"
  26
  27    // Fourth semantics:
  28    //
  29    // ---> Warning : This fourth field is NOT part
  30    //                of the 'official' Dicom Dictionnary
  31    //                and should NOT be used.
  32    //                (Not defined for all the groups
  33    //                 may be removed in a future release)
  34    //
  35    // CMD      Command
  36    // META     Meta Information
  37    // DIR      Directory
  38    // ID
  39    // PAT      Patient
  40    // ACQ      Acquisition
  41    // REL      Related
  42    // IMG      Image
  43    // SDY      Study
  44    // VIS      Visit
  45    // WAV      Waveform
  46    // PRC
  47    // DEV      Device
  48    // NMI      Nuclear Medicine
  49    // MED
  50    // BFS      Basic Film Session
  51    // BFB      Basic Film Box
  52    // BIB      Basic Image Box
  53    // BAB
  54    // IOB
  55    // PJ
  56    // PRINTER
  57    // RT       Radio Therapy
  58    // DVH
  59    // SSET
  60    // RES      Results
  61    // CRV      Curve
  62    // OLY      Overlays
  63    // PXL      Pixels
  64    // DL       Delimiters
  65    //
  66
  67 //-----------------------------------------------------------------------------
  68 // Refer to gdcmParser::CheckSwap()
  69 const unsigned int gdcmParser::HEADER_LENGTH_TO_READ = 256;
  70
  71 // Refer to gdcmParser::SetMaxSizeLoadEntry()
  72 const unsigned int gdcmParser::MAX_SIZE_LOAD_ELEMENT_VALUE = 4096;
  73
  74 // Refer to gdcmParser::SetMaxSizePrintEntry()
  75 // TODO : Right now, better see "define, in gdcmHederEntry.cxx
  76 const unsigned int gdcmParser::MAX_SIZE_PRINT_ELEMENT_VALUE = 64;
  77
  78 //-----------------------------------------------------------------------------
  79 // Constructor / Destructor
  80 /**
  81  * \ingroup gdcmParser
  82  * \brief
  83  * @param   InFilename
  84  * @param   exception_on_error
  85  * @param   enable_sequences = true to allow the header
  86  *          to be parsed *inside* the SeQuences,
  87  *          when they have an actual length
  88  * @param ignore_shadow to allow skipping the shadow elements,
  89  *           to save memory space.
  90  * \warning  The TRUE value for this param has to be used
  91  *           with a FALSE value for the 'enable_sequence' param.
  92  *           ('public elements' may be embedded in 'shadow Sequences')
  93  */
  94 gdcmParser::gdcmParser(const char *InFilename,
  95                        bool exception_on_error,
  96                        bool enable_sequences,
  97                        bool ignore_shadow) {
  98    enableSequences=enable_sequences;
  99    ignoreShadow   =ignore_shadow;
 100
 101    SetMaxSizeLoadEntry(MAX_SIZE_LOAD_ELEMENT_VALUE);
 102    filename = InFilename;
 103    Initialise();
 104
 105    if ( !OpenFile(exception_on_error))
 106       return;
 107    if (ParseHeader()) {
 108      LoadHeaderEntries();
 109    }
 110    CloseFile();
 111
 112    wasUpdated = 0;  // will be set to 1 if user adds an entry
 113    printLevel = 1;  // 'Medium' print level by default
 114 }
 115
 116 /**
 117  * \ingroup gdcmParser
 118  * \brief
 119  * @param   exception_on_error
 120  */
 121 gdcmParser::gdcmParser(bool exception_on_error) {
 122    enableSequences=0;
 123
 124    SetMaxSizeLoadEntry(MAX_SIZE_LOAD_ELEMENT_VALUE);
 125    Initialise();
 126
 127    wasUpdated = 0;  // will be set to 1 if user adds an entry
 128    printLevel = 1;  // 'Medium' print level by default
 129 }
 130
 131 /**
 132  * \ingroup gdcmParser
 133  * \brief   Canonical destructor.
 134  */
 135 gdcmParser::~gdcmParser (void) {
 136    RefPubDict = NULL;
 137    RefShaDict = NULL;
 138 }
 139
 140 //-----------------------------------------------------------------------------
 141 // Print
 142 /**
 143   * \ingroup gdcmParser
 144   * \brief   Prints the Header Entries (Dicom Elements)
 145   *          both from the H Table and the chained list
 146   * @return
 147   */
 148 void gdcmParser::PrintEntry(std::ostream & os) {
 149    std::ostringstream s;
 150
 151    for (ListTag::iterator i = listEntries.begin();
 152            i != listEntries.end();
 153            ++i)
 154    {
 155            (*i)->SetPrintLevel(printLevel);
 156            (*i)->Print(os);
 157    }
 158    os<<s.str();
 159 }
 160
 161 /**
 162   * \ingroup gdcmParser
 163   * \brief   Prints The Dict Entries of THE public Dicom Dictionnry
 164   * @return
 165   */
 166 void gdcmParser::PrintPubDict(std::ostream & os) {
 167    RefPubDict->Print(os);
 168 }
 169
 170 /**
 171   * \ingroup gdcmParser
 172   * \brief   Prints The Dict Entries of THE shadow Dicom Dictionnry
 173   * @return
 174   */
 175 void gdcmParser::PrintShaDict(std::ostream & os) {
 176    RefShaDict->Print(os);
 177 }
 178
 179 //-----------------------------------------------------------------------------
 180 // Public
 181 /**
 182  * \ingroup gdcmParser
 183  * \brief   Get the public dictionary used
 184  */
 185 gdcmDict *gdcmParser::GetPubDict(void) {
 186    return(RefPubDict);
 187 }
 188
 189 /**
 190  * \ingroup gdcmParser
 191  * \brief   Get the shadow dictionary used
 192  */
 193 gdcmDict *gdcmParser::GetShaDict(void) {
 194    return(RefShaDict);
 195 }
 196
 197 /**
 198  * \ingroup gdcmParser
 199  * \brief   Set the shadow dictionary used
 200  * \param   dict dictionary to use in shadow
 201  */
 202 bool gdcmParser::SetShaDict(gdcmDict *dict){
 203    RefShaDict=dict;
 204    return(!RefShaDict);
 205 }
 206
 207 /**
 208  * \ingroup gdcmParser
 209  * \brief   Set the shadow dictionary used
 210  * \param   dictName name of the dictionary to use in shadow
 211  */
 212 bool gdcmParser::SetShaDict(DictKey dictName){
 213    RefShaDict=gdcmGlobal::GetDicts()->GetDict(dictName);
 214    return(!RefShaDict);
 215 }
 216
 217 /**
 218  * \ingroup gdcmParser
 219  * \brief  This predicate, based on hopefully reasonable heuristics,
 220  *         decides whether or not the current gdcmParser was properly parsed
 221  *         and contains the mandatory information for being considered as
 222  *         a well formed and usable Dicom/Acr File.
 223  * @return true when gdcmParser is the one of a reasonable Dicom/Acr file,
 224  *         false otherwise.
 225  */
 226 bool gdcmParser::IsReadable(void) {
 227    if(filetype==Unknown) {
 228       return(false);
 229    }
 230    if(listEntries.size()<=0) {
 231       return(false);
 232    }
 233
 234    return(true);
 235 }
 236
 237 /**
 238  * \ingroup gdcmParser
 239  * \brief   Determines if the Transfer Syntax was already encountered
 240  *          and if it corresponds to a ImplicitVRLittleEndian one.
 241  *
 242  * @return  True when ImplicitVRLittleEndian found. False in all other cases.
 243  */
 244 bool gdcmParser::IsImplicitVRLittleEndianTransferSyntax(void) {
 245    gdcmHeaderEntry *Element = GetHeaderEntryByNumber(0x0002, 0x0010);
 246    if ( !Element )
 247       return false;
 248    LoadHeaderEntrySafe(Element);
 249
 250    std::string Transfer = Element->GetValue();
 251    if ( Transfer == UI1_2_840_10008_1_2 )
 252       return true;
 253    return false;
 254 }
 255
 256 /**
 257  * \ingroup gdcmParser
 258  * \brief   Determines if the Transfer Syntax was already encountered
 259  *          and if it corresponds to a ExplicitVRLittleEndian one.
 260  *
 261  * @return  True when ExplicitVRLittleEndian found. False in all other cases.
 262  */
 263 bool gdcmParser::IsExplicitVRLittleEndianTransferSyntax(void) {
 264    gdcmHeaderEntry* Element = GetHeaderEntryByNumber(0x0002, 0x0010);
 265    if ( !Element )
 266       return false;
 267    LoadHeaderEntrySafe(Element);
 268
 269    std::string Transfer = Element->GetValue();
 270    if ( Transfer == UI1_2_840_10008_1_2_1 )
 271       return true;
 272    return false;
 273 }
 274
 275 /**
 276  * \ingroup gdcmParser
 277  * \brief   Determines if the Transfer Syntax was already encountered
 278  *          and if it corresponds to a DeflatedExplicitVRLittleEndian one.
 279  *
 280  * @return  True when DeflatedExplicitVRLittleEndian found. False in all other cases.
 281  */
 282 bool gdcmParser::IsDeflatedExplicitVRLittleEndianTransferSyntax(void) {
 283    gdcmHeaderEntry* Element = GetHeaderEntryByNumber(0x0002, 0x0010);
 284    if ( !Element )
 285       return false;
 286    LoadHeaderEntrySafe(Element);
 287
 288    std::string Transfer = Element->GetValue();
 289    if ( Transfer == UI1_2_840_10008_1_2_1_99 )
 290       return true;
 291    return false;
 292 }
 293
 294 /**
 295  * \ingroup gdcmParser
 296  * \brief   Determines if the Transfer Syntax was already encountered
 297  *          and if it corresponds to a Explicit VR Big Endian one.
 298  *
 299  * @return  True when big endian found. False in all other cases.
 300  */
 301 bool gdcmParser::IsExplicitVRBigEndianTransferSyntax(void) {
 302    gdcmHeaderEntry* Element = GetHeaderEntryByNumber(0x0002, 0x0010);
 303    if ( !Element )
 304       return false;
 305    LoadHeaderEntrySafe(Element);
 306
 307    std::string Transfer = Element->GetValue();
 308    if ( Transfer == UI1_2_840_10008_1_2_2 )  //1.2.2 ??? A verifier !
 309       return true;
 310    return false;
 311 }
 312
 313 /**
 314  * \ingroup gdcmParser
 315  * \brief  returns the File Type
 316  *         (ACR, ACR_LIBIDO, ExplicitVR, ImplicitVR, Unknown)
 317  * @return
 318  */
 319 FileType gdcmParser::GetFileType(void) {
 320    return(filetype);
 321 }
 322
 323 /**
 324  * \ingroup gdcmParser
 325  * \brief   opens the file
 326  * @param   exception_on_error
 327  * @return
 328  */
 329 FILE *gdcmParser::OpenFile(bool exception_on_error)
 330   throw(gdcmFileError)
 331 {
 332   fp=fopen(filename.c_str(),"rb");
 333   if(exception_on_error)
 334   {
 335     if(!fp)
 336       throw gdcmFileError("gdcmParser::gdcmParser(const char *, bool)");
 337   }
 338
 339   if ( fp )
 340   {
 341      guint16 zero;
 342      fread(&zero,  (size_t)2, (size_t)1, fp);
 343
 344     //ACR -- or DICOM with no Preamble --
 345     if( zero == 0x0008 || zero == 0x0800 || zero == 0x0002 || zero == 0x0200)
 346        return(fp);
 347
 348     //DICOM
 349     fseek(fp, 126L, SEEK_CUR);
 350     char dicm[4];
 351     fread(dicm,  (size_t)4, (size_t)1, fp);
 352     if( memcmp(dicm, "DICM", 4) == 0 )
 353        return(fp);
 354
 355     fclose(fp);
 356     dbg.Verbose(0, "gdcmParser::gdcmParser not DICOM/ACR", filename.c_str());
 357   }
 358   else {
 359     dbg.Verbose(0, "gdcmParser::gdcmParser cannot open file", filename.c_str());
 360   }
 361   return(NULL);
 362 }
 363
 364 /**
 365  * \ingroup gdcmParser
 366  * \brief closes the file
 367  * @return  TRUE if the close was successfull
 368  */
 369 bool gdcmParser::CloseFile(void) {
 370   int closed = fclose(fp);
 371   fp = (FILE *)0;
 372   if (! closed)
 373      return false;
 374   return true;
 375 }
 376
 377 /**
 378  * \ingroup gdcmParser
 379  * \brief
 380  * @param fp file pointer on an already open file
 381  * @param   type type of the File to be written
 382  *          (ACR-NEMA, ExplicitVR, ImplicitVR)
 383  * @return  always "True" ?!
 384  */
 385 bool gdcmParser::Write(FILE *fp, FileType type) {
 386 // ==============
 387 // TODO The stuff was rewritten using the chained list instead
 388 //      of the H table
 389 //      so we could remove the GroupHT from the gdcmParser
 390 // To be checked
 391 // =============
 392
 393    // TODO : move the following lines (and a lot of others, to be written)
 394    // to a future function CheckAndCorrectHeader
 395
 396         // Question :
 397         // Comment pourrait-on savoir si le DcmHeader vient d'un fichier DicomV3 ou non
 398         // (FileType est un champ de gdcmParser ...)
 399         // WARNING : Si on veut ecrire du DICOM V3 a partir d'un DcmHeader ACR-NEMA
 400         // no way
 401         // a moins de se livrer a un tres complique ajout des champs manquants.
 402         // faire un CheckAndCorrectHeader (?)
 403
 404
 405    if (type == ImplicitVR)
 406    {
 407       std::string implicitVRTransfertSyntax = UI1_2_840_10008_1_2;
 408       ReplaceOrCreateByNumber(implicitVRTransfertSyntax,0x0002, 0x0010);
 409
 410       //FIXME Refer to standards on page 21, chapter 6.2 "Value representation":
 411       //      values with a VR of UI shall be padded with a single trailing null
 412       //      Dans le cas suivant on doit pader manuellement avec un 0
 413
 414       SetEntryLengthByNumber(18, 0x0002, 0x0010);
 415    }
 416
 417    if (type == ExplicitVR)
 418    {
 419       std::string explicitVRTransfertSyntax = UI1_2_840_10008_1_2_1;
 420       ReplaceOrCreateByNumber(explicitVRTransfertSyntax,0x0002, 0x0010);
 421
 422       //FIXME Refer to standards on page 21, chapter 6.2 "Value representation":
 423       //      values with a VR of UI shall be padded with a single trailing null
 424       //      Dans le cas suivant on doit pader manuellement avec un 0
 425
 426       SetEntryLengthByNumber(20, 0x0002, 0x0010);
 427    }
 428
 429 /* TODO : rewrite later
 430
 431    if ( (type == ImplicitVR) || (type == ExplicitVR) )
 432       UpdateGroupLength(false,type);
 433    if ( type == ACR)
 434       UpdateGroupLength(true,ACR);
 435 */
 436
 437    WriteEntries(type, fp);
 438    return(true);
 439  }
 440
 441 /**
 442  * \ingroup gdcmParser
 443  * \brief   Modifies the value of a given Header Entry (Dicom Element)
 444  *          if it exists; Creates it with the given value if it doesn't
 445  * @param   Value passed as a std::string
 446  * @param   Group
 447  * @param   Elem
 448  * \return  boolean
 449  */
 450 bool gdcmParser::ReplaceOrCreateByNumber(std::string Value,
 451                                          guint16 Group,
 452                                          guint16 Elem ){
 453    if (CheckIfEntryExistByNumber(Group, Elem) == 0) {
 454       gdcmHeaderEntry *a =NewHeaderEntryByNumber(Group, Elem);
 455       if (a == NULL)
 456          return false;
 457       AddHeaderEntry(a);
 458    }
 459    SetEntryByNumber(Value, Group, Elem);
 460    return(true);
 461 }
 462
 463 /**
 464  * \ingroup gdcmParser
 465  * \brief   Modifies the value of a given Header Entry (Dicom Element)
 466  *          if it exists; Creates it with the given value if it doesn't
 467  * @param   Value passed as a char*
 468  * @param   Group
 469  * @param   Elem
 470  * \return  boolean
 471  *
 472  */
 473 bool gdcmParser::ReplaceOrCreateByNumber(char* Value, guint16 Group, guint16 Elem ) {
 474    gdcmHeaderEntry* nvHeaderEntry=NewHeaderEntryByNumber(Group, Elem);
 475
 476    if(!nvHeaderEntry)
 477       return(false);
 478
 479    AddHeaderEntry(nvHeaderEntry);
 480
 481    std::string v = Value;
 482    SetEntryByNumber(v, Group, Elem);
 483    return(true);
 484 }
 485
 486 /**
 487  * \ingroup gdcmParser
 488  * \brief   Set a new value if the invoked element exists
 489  *          Seems to be useless !!!
 490  * @param   Value
 491  * @param   Group
 492  * @param   Elem
 493  * \return  boolean
 494  */
 495 bool gdcmParser::ReplaceIfExistByNumber(char* Value, guint16 Group, guint16 Elem )
 496 {
 497    std::string v = Value;
 498    SetEntryByNumber(v, Group, Elem);
 499    return true;
 500 }
 501
 502 //-----------------------------------------------------------------------------
 503 // Protected
 504 /**
 505  * \ingroup gdcmParser
 506  * \brief   Checks if a given Dicom Element exists
 507  * \        within the H table
 508  * @param   group Group   number of the searched Dicom Element
 509  * @param   element  Element number of the searched Dicom Element
 510  * @return  number of occurences
 511  */
 512 int gdcmParser::CheckIfEntryExistByNumber(guint16 group, guint16 element ) {
 513         std::string key = gdcmDictEntry::TranslateToKey(group, element );
 514         return (tagHT.count(key));
 515 }
 516
 517 /**
 518  * \ingroup gdcmParser
 519  * \brief   Searches within Header Entries (Dicom Elements) parsed with
 520  *          the public and private dictionaries
 521  *          for the element value of a given tag.
 522  * \warning Don't use any longer : use GetPubEntryByName
 523  * @param   tagName name of the searched element.
 524  * @return  Corresponding element value when it exists,
 525  *          and the string GDCM_UNFOUND ("gdcm::Unfound") otherwise.
 526  */
 527 std::string gdcmParser::GetEntryByName(std::string tagName) {
 528    gdcmDictEntry *dictEntry = RefPubDict->GetDictEntryByName(tagName);
 529    if( dictEntry == NULL)
 530       return GDCM_UNFOUND;
 531
 532    return(GetEntryByNumber(dictEntry->GetGroup(),dictEntry->GetElement()));
 533 }
 534
 535 /**
 536  * \ingroup gdcmParser
 537  * \brief   Searches within Header Entries (Dicom Elements) parsed with
 538  *          the public and private dictionaries
 539  *          for the element value representation of a given tag.
 540  *
 541  *          Obtaining the VR (Value Representation) might be needed by caller
 542  *          to convert the string typed content to caller's native type
 543  *          (think of C++ vs Python). The VR is actually of a higher level
 544  *          of semantics than just the native C++ type.
 545  * @param   tagName name of the searched element.
 546  * @return  Corresponding element value representation when it exists,
 547  *          and the string GDCM_UNFOUND ("gdcm::Unfound") otherwise.
 548  */
 549 std::string gdcmParser::GetEntryVRByName(std::string tagName) {
 550    gdcmDictEntry *dictEntry = RefPubDict->GetDictEntryByName(tagName);
 551    if( dictEntry == NULL)
 552       return GDCM_UNFOUND;
 553
 554    gdcmHeaderEntry* elem =  GetHeaderEntryByNumber(dictEntry->GetGroup(),
 555                                                    dictEntry->GetElement());
 556    return elem->GetVR();
 557 }
 558
 559 /**
 560  * \ingroup gdcmParser
 561  * \brief   Searches within Header Entries (Dicom Elements) parsed with
 562  *          the public and private dictionaries
 563  *          for the element value representation of a given tag.
 564  * @param   group Group of the searched tag.
 565  * @param   element Element of the searched tag.
 566  * @return  Corresponding element value representation when it exists,
 567  *          and the string GDCM_UNFOUND ("gdcm::Unfound") otherwise.
 568  */
 569 std::string gdcmParser::GetEntryByNumber(guint16 group, guint16 element){
 570    TagKey key = gdcmDictEntry::TranslateToKey(group, element);
 571    if ( ! tagHT.count(key))
 572       return GDCM_UNFOUND;
 573    return tagHT.find(key)->second->GetValue();
 574 }
 575
 576 /**
 577  * \ingroup gdcmParser
 578  * \brief   Searches within Header Entries (Dicom Elements) parsed with
 579  *          the public and private dictionaries
 580  *          for the element value representation of a given tag..
 581  *
 582  *          Obtaining the VR (Value Representation) might be needed by caller
 583  *          to convert the string typed content to caller's native type
 584  *          (think of C++ vs Python). The VR is actually of a higher level
 585  *          of semantics than just the native C++ type.
 586  * @param   group Group of the searched tag.
 587  * @param   element Element of the searched tag.
 588  * @return  Corresponding element value representation when it exists,
 589  *          and the string GDCM_UNFOUND ("gdcm::Unfound") otherwise.
 590  */
 591 std::string gdcmParser::GetEntryVRByNumber(guint16 group, guint16 element) {
 592    gdcmHeaderEntry* elem =  GetHeaderEntryByNumber(group, element);
 593    if ( !elem )
 594       return GDCM_UNFOUND;
 595    return elem->GetVR();
 596 }
 597
 598 /**
 599  * \ingroup gdcmParser
 600  * \brief   Sets the value (string) of the Header Entry (Dicom Element)
 601  * @param   content string value of the Dicom Element
 602  * @param   tagName name of the searched Dicom Element.
 603  * @return  true when found
 604  */
 605 bool gdcmParser::SetEntryByName(std::string content,std::string tagName) {
 606    gdcmDictEntry *dictEntry = RefPubDict->GetDictEntryByName(tagName);
 607    if( dictEntry == NULL)
 608       return false;
 609
 610    return(SetEntryByNumber(content,dictEntry->GetGroup(),
 611                                    dictEntry->GetElement()));
 612 }
 613
 614 /**
 615  * \ingroup gdcmParser
 616  * \brief   Accesses an existing gdcmHeaderEntry (i.e. a Dicom Element)
 617  *          through it's (group, element) and modifies it's content with
 618  *          the given value.
 619  * \warning Don't use any longer : use SetPubEntryByNumber
 620  * @param   content new value to substitute with
 621  * @param   group   group of the Dicom Element to modify
 622  * @param   element element of the Dicom Element to modify
 623  */
 624 bool gdcmParser::SetEntryByNumber(std::string content,
 625                                   guint16 group,
 626                                   guint16 element)
 627 {
 628    TagKey key = gdcmDictEntry::TranslateToKey(group, element);
 629    if ( ! tagHT.count(key))
 630       return false;
 631    int l = content.length();
 632    if(l%2) // Odd length are padded with a space (020H).
 633    {
 634       l++;
 635       content = content + '\0';
 636    }
 637
 638    gdcmHeaderEntry * a;
 639    IterHT p;
 640    TagHeaderEntryHT::iterator p2;
 641    // DO NOT remove the following lines : they explain the stuff
 642    //p= tagHT.equal_range(key); // get a pair of iterators first-last synonym
 643    //p2=p.first;                // iterator on the first synonym
 644    //a=p2->second;              // H Table target column (2-nd col)
 645
 646    // or, easier :
 647    a = ((tagHT.equal_range(key)).first)->second;
 648
 649    a-> SetValue(content);
 650
 651    std::string vr = a->GetVR();
 652
 653    guint32 lgr;
 654    if( (vr == "US") || (vr == "SS") )
 655       lgr = 2;
 656    else if( (vr == "UL") || (vr == "SL") )
 657       lgr = 4;
 658    else
 659       lgr = l;
 660
 661    a->SetLength(lgr);
 662    return true;
 663 }
 664
 665 /**
 666  * \ingroup gdcmParser
 667  * \brief   Accesses an existing gdcmHeaderEntry (i.e. a Dicom Element)
 668  *          in the PubHeaderEntrySet of this instance
 669  *          through it's (group, element) and modifies it's length with
 670  *          the given value.
 671  * \warning Use with extreme caution.
 672  * @param   length new length to substitute with
 673  * @param   group   group of the entry to modify
 674  * @param   element element of the Entry to modify
 675  * @return  1 on success, 0 otherwise.
 676  */
 677
 678 bool gdcmParser::SetEntryLengthByNumber(guint32 length,
 679                                         guint16 group,
 680                                         guint16 element)
 681 {
 682    TagKey key = gdcmDictEntry::TranslateToKey(group, element);
 683    if ( ! tagHT.count(key))
 684       return false;
 685    if (length%2) length++; // length must be even
 686    ( ((tagHT.equal_range(key)).first)->second )->SetLength(length);
 687
 688    return true ;
 689 }
 690
 691 /**
 692  * \ingroup gdcmParser
 693  * \brief   Gets (from Header) the offset  of a 'non string' element value
 694  * \        (LoadElementValues has already be executed)
 695  * @param   Group
 696  * @param   Elem
 697  * @return File Offset of the Element Value
 698  */
 699 size_t gdcmParser::GetEntryOffsetByNumber(guint16 Group, guint16 Elem)
 700 {
 701    gdcmHeaderEntry* Entry = GetHeaderEntryByNumber(Group, Elem);
 702    if (!Entry)
 703    {
 704       dbg.Verbose(1, "gdcmParser::GetHeaderEntryByNumber",
 705                       "failed to Locate gdcmHeaderEntry");
 706       return (size_t)0;
 707    }
 708    return Entry->GetOffset();
 709 }
 710
 711 /**
 712  * \ingroup gdcmParser
 713  * \brief   Gets (from Header) a 'non string' element value
 714  * \        (LoadElementValues has already be executed)
 715  * @param   Group
 716  * @param   Elem
 717  * @return Pointer to the 'non string' area
 718  */
 719 void * gdcmParser::GetEntryVoidAreaByNumber(guint16 Group, guint16 Elem)
 720 {
 721    gdcmHeaderEntry* Entry = GetHeaderEntryByNumber(Group, Elem);
 722    if (!Entry)
 723    {
 724       dbg.Verbose(1, "gdcmParser::GetHeaderEntryByNumber",
 725                   "failed to Locate gdcmHeaderEntry");
 726       return (NULL);
 727    }
 728    return Entry->GetVoidArea();
 729 }
 730
 731 /**
 732  * \ingroup       gdcmParser
 733  * \brief         Loads (from disk) the element content
 734  *                when a string is not suitable
 735  * @param   Group
 736  * @param   Elem
 737  */
 738 void *gdcmParser::LoadEntryVoidArea(guint16 Group, guint16 Elem)
 739 {
 740    gdcmHeaderEntry * Element= GetHeaderEntryByNumber(Group, Elem);
 741    if ( !Element )
 742       return NULL;
 743    size_t o =(size_t)Element->GetOffset();
 744    fseek(fp, o, SEEK_SET);
 745    int l=Element->GetLength();
 746    void * a = malloc(l);
 747    if(!a)
 748         return NULL;
 749
 750    SetEntryVoidAreaByNumber(a, Group, Elem);
 751    // TODO check the result
 752    size_t l2 = fread(a, 1, l ,fp);
 753    if(l != l2)
 754    {
 755         free(a);
 756         return NULL;
 757    }
 758    return a;
 759 }
 760
 761 /**
 762  * \ingroup gdcmParser
 763  * \brief   Sets a 'non string' value to a given Dicom Element
 764  * @param   area
 765  * @param   group Group number of the searched Dicom Element
 766  * @param   element Element number of the searched Dicom Element
 767  * @return
 768  */
 769 bool gdcmParser::SetEntryVoidAreaByNumber(void * area,
 770                                           guint16 group,
 771                                           guint16 element)
 772 {
 773    TagKey key = gdcmDictEntry::TranslateToKey(group, element);
 774    if ( ! tagHT.count(key))
 775       return false;
 776    ( ((tagHT.equal_range(key)).first)->second )->SetVoidArea(area);
 777    return true;
 778 }
 779
 780 /**
 781  * \ingroup gdcmParser
 782  * \brief   Update the entries with the shadow dictionary. Only odd entries are
 783  *          analized
 784  */
 785 void gdcmParser::UpdateShaEntries(void) {
 786    gdcmDictEntry *entry;
 787    std::string vr;
 788
 789    for(ListTag::iterator it=listEntries.begin();
 790        it!=listEntries.end();
 791        ++it)
 792    {
 793       // Odd group => from public dictionary
 794       if((*it)->GetGroup()%2==0)
 795          continue;
 796
 797       // Peer group => search the corresponding dict entry
 798       if(RefShaDict)
 799          entry=RefShaDict->GetDictEntryByNumber((*it)->GetGroup(),(*it)->GetElement());
 800       else
 801          entry=NULL;
 802
 803       if((*it)->IsImplicitVR())
 804          vr="Implicit";
 805       else
 806          vr=(*it)->GetVR();
 807
 808       (*it)->SetValue(GetHeaderEntryUnvalue(*it));
 809       if(entry){
 810          // Set the new entry and the new value
 811          (*it)->SetDictEntry(entry);
 812          CheckHeaderEntryVR(*it,vr);
 813
 814          (*it)->SetValue(GetHeaderEntryValue(*it));
 815       }
 816       else
 817       {
 818          // Remove precedent value transformation
 819          (*it)->SetDictEntry(NewVirtualDictEntry((*it)->GetGroup(),(*it)->GetElement(),vr));
 820       }
 821    }
 822 }
 823
 824 /**
 825  * \ingroup gdcmParser
 826  * \brief   Searches within the Header Entries for a Dicom Element of
 827  *          a given tag.
 828  * @param   tagName name of the searched Dicom Element.
 829  * @return  Corresponding Dicom Element when it exists, and NULL
 830  *          otherwise.
 831  */
 832  gdcmHeaderEntry *gdcmParser::GetHeaderEntryByName(std::string tagName) {
 833    gdcmDictEntry *dictEntry = RefPubDict->GetDictEntryByName(tagName);
 834    if( dictEntry == NULL)
 835       return NULL;
 836
 837   return(GetHeaderEntryByNumber(dictEntry->GetGroup(),dictEntry->GetElement()));
 838 }
 839
 840 /**
 841  * \ingroup gdcmParser
 842  * \brief  retrieves a Dicom Element (the first one) using (group, element)
 843  * \ warning (group, element) IS NOT an identifier inside the Dicom Header
 844  *           if you think it's NOT UNIQUE, check the count number
 845  *           and use iterators to retrieve ALL the Dicoms Elements within
 846  *           a given couple (group, element)
 847  * @param   group Group number of the searched Dicom Element
 848  * @param   element Element number of the searched Dicom Element
 849  * @return
 850  */
 851 gdcmHeaderEntry* gdcmParser::GetHeaderEntryByNumber(guint16 group, guint16 element)
 852 {
 853    TagKey key = gdcmDictEntry::TranslateToKey(group, element);
 854    if ( ! tagHT.count(key))
 855       return NULL;
 856    return tagHT.find(key)->second;
 857 }
 858
 859 /**
 860  * \ingroup gdcmParser
 861  * \brief   retrieves the Dicom Elements (all of them) using (group, element)
 862  * @param   group Group number of the searched Dicom Element.
 863  * @param   element Element number of the searched Dicom Element.
 864  * @return  a range (i.e.pair<,>) containing all elements whose key is group|element)
 865  */
 866
 867 IterHT gdcmParser::GetHeaderEntrySameNumber(guint16 group, guint16 element){
 868    TagKey key = gdcmDictEntry::TranslateToKey(group, element);
 869    return (tagHT.equal_range(key));
 870 }
 871
 872 /**
 873  * \ingroup       gdcmParser
 874  * \brief         Loads the element while preserving the current
 875  *                underlying file position indicator as opposed to
 876  *                to LoadHeaderEntry that modifies it.
 877  * @param entry   Header Entry whose value shall be loaded.
 878  * @return
 879  */
 880 void gdcmParser::LoadHeaderEntrySafe(gdcmHeaderEntry * entry) {
 881    long PositionOnEntry = ftell(fp);
 882    LoadHeaderEntry(entry);
 883    fseek(fp, PositionOnEntry, SEEK_SET);
 884 }
 885
 886 /**
 887  * \ingroup gdcmParser
 888  * \brief   Re-computes the length of a ACR-NEMA/Dicom group from a DcmHeader
 889  * \warning : to be re-written using the chained list instead of the H table.
 890  * \warning : DO NOT use (doesn't work any longer because of the multimap)
 891  * \todo : to be re-written using the chained list instead of the H table
 892  * @param   SkipSequence TRUE if we don't want to write Sequences (ACR-NEMA Files)
 893  * @param   type Type of the File (ExplicitVR,ImplicitVR, ACR, ...)
 894  */
 895 void gdcmParser::UpdateGroupLength(bool SkipSequence, FileType type) {
 896    guint16 gr, el;
 897    std::string vr;
 898
 899    gdcmHeaderEntry *elem;
 900    char trash[10];
 901    std::string str_trash;
 902
 903    GroupKey key;
 904    GroupHT groupHt;  // to hold the length of each group
 905    TagKey tk;
 906    // remember :
 907    // typedef std::map<GroupKey, int> GroupHT;
 908
 909    gdcmHeaderEntry *elemZ;
 910
 911    // for each Tag in the DCM Header
 912
 913    for (TagHeaderEntryHT::iterator tag2 = tagHT.begin();
 914         tag2 != tagHT.end();
 915         ++tag2)
 916    {
 917       elem  = tag2->second;
 918       gr = elem->GetGroup();
 919       el = elem->GetElement();
 920       vr = elem->GetVR();
 921
 922       sprintf(trash, "%04x", gr);
 923       key = trash;              // generate 'group tag'
 924
 925       // if the caller decided not to take SEQUENCEs into account
 926       // e.g : he wants to write an ACR-NEMA File
 927
 928       if (SkipSequence && vr == "SQ")
 929          continue;
 930
 931       // Still unsolved problem :
 932       // we cannot find the 'Sequence Delimitation Item'
 933       // since it's at the end of the Hash Table
 934       // (fffe,e0dd)
 935
 936       // pas SEQUENCE en ACR-NEMA
 937       // WARNING :
 938       // --> la descente a l'interieur' des SQ
 939       // devrait etre faite avec une liste chainee, pas avec une HTable...
 940
 941       if ( groupHt.count(key) == 0) // we just read the first elem of a given group
 942       {
 943          if (el == 0x0000) // the first elem is 0x0000
 944          {
 945             groupHt[key] = 0;         // initialize group length
 946          }
 947          else
 948          {
 949             groupHt[key] = 2 + 2 + 4 + elem->GetLength(); // non 0x0000 first group elem
 950          }
 951       }
 952       else // any elem but the first
 953       {
 954          if (type == ExplicitVR)
 955          {
 956             if ( (vr == "OB") || (vr == "OW") || (vr == "SQ") )
 957             {
 958                groupHt[key] +=  4; // explicit VR AND OB, OW, SQ : 4 more bytes
 959             }
 960          }
 961          groupHt[key] += 2 + 2 + 4 + elem->GetLength();
 962       }
 963    }
 964
 965    unsigned short int gr_bid;
 966
 967    for (GroupHT::iterator g = groupHt.begin(); // for each group we found
 968         g != groupHt.end();
 969         ++g)
 970    {
 971       // FIXME: g++ -Wall -Wstrict-prototypes reports on following line:
 972       //        warning: unsigned int format, different type arg
 973       sscanf(g->first.c_str(),"%x",&gr_bid);
 974       tk = g->first + "|0000";                  // generate the element full tag
 975
 976       if ( tagHT.count(tk) == 0) // if element 0x0000 not found
 977       {
 978          gdcmDictEntry * tagZ = new gdcmDictEntry(gr_bid, 0x0000, "UL");
 979          elemZ = new gdcmHeaderEntry(tagZ);
 980          elemZ->SetLength(4);
 981          AddHeaderEntry(elemZ);                         // create it
 982       }
 983       else
 984       {
 985          elemZ=GetHeaderEntryByNumber(gr_bid, 0x0000);
 986       }
 987       sprintf(trash ,"%d",g->second);
 988       str_trash=trash;
 989       elemZ->SetValue(str_trash);
 990    }
 991 }
 992
 993 /**
 994  * \ingroup gdcmParser
 995  * \brief   writes on disc according to the requested format
 996  * \        (ACR-NEMA, ExplicitVR, ImplicitVR) the image
 997  * \ warning does NOT add the missing elements in the header :
 998  * \         it's up to the user doing it !
 999  * \         (function CheckHeaderCoherence to be written)
1000  * \ warning DON'T try, right now, to write a DICOM image
1001  * \         from an ACR Header (meta elements will be missing!)
1002  * @param   type type of the File to be written
1003  *          (ACR-NEMA, ExplicitVR, ImplicitVR)
1004  * @param   _fp already open file pointer
1005  */
1006 void gdcmParser::WriteEntries(FileType type, FILE * _fp)
1007 {
1008    guint16 gr, el;
1009    guint32 lgr;
1010    const char * val;
1011    std::string vr;
1012    guint32 val_uint32;
1013    guint16 val_uint16;
1014    guint16 valZero =0;
1015    std::vector<std::string> tokens;
1016
1017    // TODO : function CheckHeaderCoherence to be written
1018
1019    //  uses now listEntries to iterate, not TagHt!
1020    //
1021    //        pb : gdcmParser.Add does NOT update listEntries
1022    //       TODO : find a trick (in STL?) to do it, at low cost !
1023
1024    void *ptr;
1025
1026    // TODO (?) tester les echecs en ecriture (apres chaque fwrite)
1027    int compte =0;
1028
1029    for (ListTag::iterator tag2=listEntries.begin();
1030         tag2 != listEntries.end();
1031         ++tag2)
1032    {
1033       gr =  (*tag2)->GetGroup();
1034       el =  (*tag2)->GetElement();
1035       lgr = (*tag2)->GetReadLength();
1036       val = (*tag2)->GetValue().c_str();
1037       vr =  (*tag2)->GetVR();
1038       if ( type == ACR )
1039       {
1040          if (gr < 0x0008)   continue; // ignore pure DICOM V3 groups
1041          if (gr %2)         continue; // ignore shadow groups
1042          if (vr == "SQ" )   continue; // ignore Sequences
1043                    // TODO : find a trick to *skip* the SeQuences !
1044                    // Not only ignore the SQ element
1045          if (gr == 0xfffe ) continue; // ignore delimiters
1046       }
1047
1048       fwrite ( &gr,(size_t)2 ,(size_t)1 ,_fp);  //group
1049       fwrite ( &el,(size_t)2 ,(size_t)1 ,_fp);  //element
1050
1051       // === Deal with the length
1052       //     --------------------
1053
1054       // if ( (type == ExplicitVR) && (gr <= 0x0002) ) // ?!?  < 2
1055       if ( (type == ExplicitVR) || (type == DICOMDIR) )
1056       {
1057          // EXPLICIT VR
1058          guint16 z=0, shortLgr;
1059          if (vr == "Unknown") { // Unknown was 'written'
1060             shortLgr=lgr;
1061             fwrite ( &shortLgr,(size_t)2 ,(size_t)1 ,_fp);
1062             fwrite ( &z,  (size_t)2 ,(size_t)1 ,_fp);
1063          } else {
1064             if (gr != 0xfffe) { // NO value for 'delimiters'
1065               if (vr == "Unknown") // Unknown was 'written'
1066                  fwrite(&z,(size_t)2 ,(size_t)1 ,_fp);
1067               else
1068                  fwrite (vr.c_str(),(size_t)2 ,(size_t)1 ,_fp);
1069             }
1070
1071             if ( (vr == "OB") || (vr == "OW") || (vr == "SQ") || gr == 0xfffe) // JPR
1072             {
1073                if (gr != 0xfffe)
1074                   fwrite ( &z,  (size_t)2 ,(size_t)1 ,_fp);
1075                fwrite ( &lgr,(size_t)4 ,(size_t)1 ,_fp);
1076             }
1077             else
1078             {
1079                shortLgr=lgr;
1080                fwrite ( &shortLgr,(size_t)2 ,(size_t)1 ,_fp);
1081             }
1082          }
1083       }
1084       else // IMPLICIT VR
1085       {
1086          fwrite ( &lgr,(size_t)4 ,(size_t)1 ,_fp);
1087       }
1088
1089       // === Deal with the value
1090       //     -------------------
1091       if (vr == "SQ")  continue; // no "value" to write for the SEQuences
1092       if (gr == 0xfffe)continue;
1093
1094       if (vr == "US" || vr == "SS")
1095       {
1096          tokens.erase(tokens.begin(),tokens.end()); // clean any previous value
1097          Tokenize ((*tag2)->GetValue(), tokens, "\\");
1098          for (unsigned int i=0; i<tokens.size();i++)
1099          {
1100             val_uint16 = atoi(tokens[i].c_str());
1101             ptr = &val_uint16;
1102             fwrite ( ptr,(size_t)2 ,(size_t)1 ,_fp);
1103          }
1104          tokens.clear();
1105          continue;
1106       }
1107       if (vr == "UL" || vr == "SL")
1108       {
1109          tokens.erase(tokens.begin(),tokens.end()); // clean any previous value
1110          Tokenize ((*tag2)->GetValue(), tokens, "\\");
1111          for (unsigned int i=0; i<tokens.size();i++)
1112          {
1113             val_uint32 = atoi(tokens[i].c_str());
1114             ptr = &val_uint32;
1115             fwrite ( ptr,(size_t)4 ,(size_t)1 ,_fp);
1116          }
1117          tokens.clear();
1118          continue;
1119       }
1120
1121       // Pixels are never loaded in the element !
1122       // we stop writting when Pixel are processed
1123       // FIX : we loose trailing elements (RAB, right now)
1124
1125       if ((gr == GrPixel) && (el == NumPixel) ) {
1126          compte++;
1127          if (compte == countGrPixel) // we passed *all* the GrPixel,NumPixel
1128             break;
1129       }
1130       fwrite ( val,(size_t)lgr ,(size_t)1 ,_fp); // Elem value
1131    }
1132 }
1133
1134 /**
1135  * \ingroup gdcmParser
1136  * \brief   Swaps back the bytes of 4-byte long integer accordingly to
1137  *          processor order.
1138  * @return  The properly swaped 32 bits integer.
1139  */
1140 guint32 gdcmParser::SwapLong(guint32 a) {
1141    switch (sw) {
1142       case    0 :
1143          break;
1144       case 4321 :
1145          a=( ((a<<24) & 0xff000000) | ((a<<8)  & 0x00ff0000) |
1146              ((a>>8)  & 0x0000ff00) | ((a>>24) & 0x000000ff) );
1147          break;
1148
1149       case 3412 :
1150          a=( ((a<<16) & 0xffff0000) | ((a>>16) & 0x0000ffff) );
1151          break;
1152
1153       case 2143 :
1154          a=( ((a<<8) & 0xff00ff00) | ((a>>8) & 0x00ff00ff)  );
1155          break;
1156       default :
1157          dbg.Error(" gdcmParser::SwapLong : unset swap code");
1158          a=0;
1159    }
1160    return(a);
1161 }
1162
1163 /**
1164  * \ingroup gdcmParser
1165  * \brief   Unswaps back the bytes of 4-byte long integer accordingly to
1166  *          processor order.
1167  * @return  The properly unswaped 32 bits integer.
1168  */
1169 guint32 gdcmParser::UnswapLong(guint32 a) {
1170    return (SwapLong(a));
1171 }
1172
1173 /**
1174  * \ingroup gdcmParser
1175  * \brief   Swaps the bytes so they agree with the processor order
1176  * @return  The properly swaped 16 bits integer.
1177  */
1178 guint16 gdcmParser::SwapShort(guint16 a) {
1179    if ( (sw==4321)  || (sw==2143) )
1180       a =(((a<<8) & 0x0ff00) | ((a>>8)&0x00ff));
1181    return (a);
1182 }
1183
1184 /**
1185  * \ingroup gdcmParser
1186  * \brief   Unswaps the bytes so they agree with the processor order
1187  * @return  The properly unswaped 16 bits integer.
1188  */
1189 guint16 gdcmParser::UnswapShort(guint16 a) {
1190    return (SwapShort(a));
1191 }
1192
1193 //-----------------------------------------------------------------------------
1194 // Private
1195 /**
1196  * \ingroup gdcmParser
1197  * \brief   Parses the header of the file but WITHOUT loading element values.
1198  * @return  false if file is not ACR-NEMA / DICOM
1199  */
1200 bool gdcmParser::ParseHeader(bool exception_on_error) throw(gdcmFormatError) {
1201
1202    rewind(fp);
1203    if (!CheckSwap())
1204       return false;
1205
1206    gdcmHeaderEntry *newHeaderEntry = (gdcmHeaderEntry *)0;
1207    while ( (newHeaderEntry = ReadNextHeaderEntry()) ) {
1208      SkipHeaderEntry(newHeaderEntry);
1209      if ( (ignoreShadow==0) || (newHeaderEntry->GetGroup()%2) == 0) {
1210         AddHeaderEntry(newHeaderEntry);
1211      }
1212    }
1213    return true;
1214 }
1215
1216 /**
1217  * \ingroup gdcmParser
1218  * \brief   Loads the element values of all the Header Entries pointed in the
1219  *          public Chained List.
1220  */
1221 void gdcmParser::LoadHeaderEntries(void) {
1222    rewind(fp);
1223    for (ListTag::iterator i = GetListEntry().begin();
1224       i != GetListEntry().end();
1225       ++i)
1226    {
1227       LoadHeaderEntry(*i);
1228    }
1229
1230    rewind(fp);
1231
1232    // Load 'non string' values
1233    std::string PhotometricInterpretation = GetEntryByNumber(0x0028,0x0004);
1234    if( PhotometricInterpretation == "PALETTE COLOR " ) {
1235       LoadEntryVoidArea(0x0028,0x1200);  // gray LUT
1236       LoadEntryVoidArea(0x0028,0x1201);  // R    LUT
1237       LoadEntryVoidArea(0x0028,0x1202);  // G    LUT
1238       LoadEntryVoidArea(0x0028,0x1203);  // B    LUT
1239
1240       LoadEntryVoidArea(0x0028,0x1221);  // Segmented Red   Palette Color LUT Data
1241       LoadEntryVoidArea(0x0028,0x1222);  // Segmented Green Palette Color LUT Data
1242       LoadEntryVoidArea(0x0028,0x1223);  // Segmented Blue  Palette Color LUT Data
1243    }
1244
1245    // --------------------------------------------------------------
1246    // Special Patch to allow gdcm to read ACR-LibIDO formated images
1247    //
1248    // if recognition code tells us we deal with a LibIDO image
1249    // we switch lineNumber and columnNumber
1250    //
1251    std::string RecCode;
1252    RecCode = GetEntryByNumber(0x0008, 0x0010); // recognition code
1253    if (RecCode == "ACRNEMA_LIBIDO_1.1" ||
1254        RecCode == "CANRME_AILIBOD1_1." )
1255    {
1256          filetype = ACR_LIBIDO;
1257          std::string rows    = GetEntryByNumber(0x0028, 0x0010);
1258          std::string columns = GetEntryByNumber(0x0028, 0x0011);
1259          SetEntryByNumber(columns, 0x0028, 0x0010);
1260          SetEntryByNumber(rows   , 0x0028, 0x0011);
1261    }
1262    // ----------------- End of Special Patch ----------------
1263 }
1264
1265 /**
1266  * \ingroup       gdcmParser
1267  * \brief         Loads the element content if its length doesn't exceed
1268  *                the value specified with gdcmParser::SetMaxSizeLoadEntry()
1269  * @param         Entry Header Entry (Dicom Element) to be dealt with
1270  */
1271 void gdcmParser::LoadHeaderEntry(gdcmHeaderEntry *Entry)  {
1272    size_t item_read;
1273    guint16 group  = Entry->GetGroup();
1274    std::string  vr= Entry->GetVR();
1275    guint32 length = Entry->GetLength();
1276    bool SkipLoad  = false;
1277
1278    fseek(fp, (long)Entry->GetOffset(), SEEK_SET);
1279
1280    // the test was commented out to 'go inside' the SeQuences
1281    // we don't any longer skip them !
1282
1283    // if( vr == "SQ" )  //  (DO NOT remove this comment)
1284    //    SkipLoad = true;
1285
1286    // A SeQuence "contains" a set of Elements.
1287    //          (fffe e000) tells us an Element is beginning
1288    //          (fffe e00d) tells us an Element just ended
1289    //          (fffe e0dd) tells us the current SeQuence just ended
1290    if( group == 0xfffe )
1291       SkipLoad = true;
1292
1293    if ( SkipLoad ) {
1294       Entry->SetLength(0);
1295       Entry->SetValue("gdcm::Skipped");
1296       return;
1297    }
1298
1299    // When the length is zero things are easy:
1300    if ( length == 0 ) {
1301       Entry->SetValue("");
1302       return;
1303    }
1304
1305    // The elements whose length is bigger than the specified upper bound
1306    // are not loaded. Instead we leave a short notice of the offset of
1307    // the element content and it's length.
1308    if (length > MaxSizeLoadEntry) {
1309       std::ostringstream s;
1310       s << "gdcm::NotLoaded.";
1311       s << " Address:" << (long)Entry->GetOffset();
1312       s << " Length:"  << Entry->GetLength();
1313       s << " x(" << std::hex << Entry->GetLength() << ")";
1314       Entry->SetValue(s.str());
1315       return;
1316    }
1317
1318    // When integer(s) are expected, read and convert the following
1319    // n *(two or four bytes)
1320    // properly i.e. as integers as opposed to strings.
1321    // Elements with Value Multiplicity > 1
1322    // contain a set of integers (not a single one)
1323
1324    // Any compacter code suggested (?)
1325    if ( IsHeaderEntryAnInteger(Entry) ) {
1326       guint32 NewInt;
1327       std::ostringstream s;
1328       int nbInt;
1329       if (vr == "US" || vr == "SS") {
1330          nbInt = length / 2;
1331          NewInt = ReadInt16();
1332          s << NewInt;
1333          if (nbInt > 1){
1334             for (int i=1; i < nbInt; i++) {
1335                s << '\\';
1336                NewInt = ReadInt16();
1337                s << NewInt;
1338             }
1339          }
1340       }
1341       else if (vr == "UL" || vr == "SL") {
1342          nbInt = length / 4;
1343          NewInt = ReadInt32();
1344          s << NewInt;
1345          if (nbInt > 1) {
1346             for (int i=1; i < nbInt; i++) {
1347                s << '\\';
1348                NewInt = ReadInt32();
1349                s << NewInt;
1350             }
1351          }
1352       }
1353 #ifdef GDCM_NO_ANSI_STRING_STREAM
1354       s << std::ends; // to avoid oddities on Solaris
1355 #endif //GDCM_NO_ANSI_STRING_STREAM
1356
1357       Entry->SetValue(s.str());
1358       return;
1359    }
1360
1361    // We need an additional byte for storing \0 that is not on disk
1362    std::string NewValue(length,0);
1363    item_read = fread(&(NewValue[0]), (size_t)length, (size_t)1, fp);
1364    if ( item_read != 1 ) {
1365       dbg.Verbose(1, "gdcmParser::LoadElementValue","unread element value");
1366       Entry->SetValue("gdcm::UnRead");
1367       return;
1368    }
1369
1370    if( (vr == "UI") ) // Because of correspondance with the VR dic
1371       Entry->SetValue(NewValue.c_str()); // ??? JPR ???
1372    else
1373       Entry->SetValue(NewValue);
1374 }
1375
1376 /**
1377  * \ingroup gdcmParser
1378  * \brief   add a new Dicom Element pointer to
1379  *          the H Table and to the chained List
1380  * \warning push_bash in listEntries ONLY during ParseHeader
1381  * \TODO    something to allow further Elements addition,
1382  * \        when position to be taken care of
1383  * @param   newHeaderEntry
1384  */
1385 void gdcmParser::AddHeaderEntry(gdcmHeaderEntry *newHeaderEntry) {
1386    tagHT.insert( PairHT( newHeaderEntry->GetKey(),newHeaderEntry) );
1387    listEntries.push_back(newHeaderEntry);
1388    wasUpdated = 1;
1389 }
1390
1391 /**
1392  * \ingroup gdcmParser
1393  * \brief
1394  * @param   Entry Header Entry whose length of the value shall be loaded.
1395
1396  * @return
1397  */
1398  void gdcmParser::FindHeaderEntryLength (gdcmHeaderEntry *Entry) {
1399    guint16 element = Entry->GetElement();
1400    guint16 group   = Entry->GetGroup();
1401    std::string  vr = Entry->GetVR();
1402    guint16 length16;
1403    if( (element == NumPixel) && (group == GrPixel) )
1404    {
1405       dbg.SetDebug(-1);
1406       dbg.Verbose(2, "gdcmParser::FindLength: ",
1407                      "we reached (GrPixel,NumPixel)");
1408    }
1409
1410    if ( (filetype == ExplicitVR) && (! Entry->IsImplicitVR()) )
1411    {
1412       if ( (vr=="OB") || (vr=="OW") || (vr=="SQ") || (vr=="UN") )
1413       {
1414          // The following reserved two bytes (see PS 3.5-2001, section
1415          // 7.1.2 Data element structure with explicit vr p27) must be
1416          // skipped before proceeding on reading the length on 4 bytes.
1417          fseek(fp, 2L, SEEK_CUR);
1418          guint32 length32 = ReadInt32();
1419
1420          if ( (vr == "OB") && (length32 == 0xffffffff) )
1421          {
1422             Entry->SetLength(FindHeaderEntryLengthOB());
1423             return;
1424          }
1425          FixHeaderEntryFoundLength(Entry, length32);
1426          return;
1427       }
1428
1429       // Length is encoded on 2 bytes.
1430       length16 = ReadInt16();
1431
1432       // We can tell the current file is encoded in big endian (like
1433       // Data/US-RGB-8-epicard) when we find the "Transfer Syntax" tag
1434       // and it's value is the one of the encoding of a big endian file.
1435       // In order to deal with such big endian encoded files, we have
1436       // (at least) two strategies:
1437       // * when we load the "Transfer Syntax" tag with value of big endian
1438       //   encoding, we raise the proper flags. Then we wait for the end
1439       //   of the META group (0x0002) among which is "Transfer Syntax",
1440       //   before switching the swap code to big endian. We have to postpone
1441       //   the switching of the swap code since the META group is fully encoded
1442       //   in little endian, and big endian coding only starts at the next
1443       //   group. The corresponding code can be hard to analyse and adds
1444       //   many additional unnecessary tests for regular tags.
1445       // * the second strategy consists in waiting for trouble, that shall
1446       //   appear when we find the first group with big endian encoding. This
1447       //   is easy to detect since the length of a "Group Length" tag (the
1448       //   ones with zero as element number) has to be of 4 (0x0004). When we
1449       //   encounter 1024 (0x0400) chances are the encoding changed and we
1450       //   found a group with big endian encoding.
1451       // We shall use this second strategy. In order to make sure that we
1452       // can interpret the presence of an apparently big endian encoded
1453       // length of a "Group Length" without committing a big mistake, we
1454       // add an additional check: we look in the already parsed elements
1455       // for the presence of a "Transfer Syntax" whose value has to be "big
1456       // endian encoding". When this is the case, chances are we have got our
1457       // hands on a big endian encoded file: we switch the swap code to
1458       // big endian and proceed...
1459       if ( (element  == 0x0000) && (length16 == 0x0400) )
1460       {
1461          if ( ! IsExplicitVRBigEndianTransferSyntax() )
1462          {
1463             dbg.Verbose(0, "gdcmParser::FindLength", "not explicit VR");
1464             errno = 1;
1465             return;
1466          }
1467          length16 = 4;
1468          SwitchSwapToBigEndian();
1469          // Restore the unproperly loaded values i.e. the group, the element
1470          // and the dictionary entry depending on them.
1471          guint16 CorrectGroup   = SwapShort(Entry->GetGroup());
1472          guint16 CorrectElem    = SwapShort(Entry->GetElement());
1473          gdcmDictEntry * NewTag = GetDictEntryByNumber(CorrectGroup,
1474                                                        CorrectElem);
1475          if (!NewTag)
1476          {
1477             // This correct tag is not in the dictionary. Create a new one.
1478             NewTag = NewVirtualDictEntry(CorrectGroup, CorrectElem);
1479          }
1480          // FIXME this can create a memory leaks on the old entry that be
1481          // left unreferenced.
1482          Entry->SetDictEntry(NewTag);
1483       }
1484
1485       // Heuristic: well some files are really ill-formed.
1486       if ( length16 == 0xffff)
1487       {
1488          length16 = 0;
1489          //dbg.Verbose(0, "gdcmParser::FindLength",
1490          //            "Erroneous element length fixed.");
1491          // Actually, length= 0xffff means that we deal with
1492          // Unknown Sequence Length
1493       }
1494
1495       FixHeaderEntryFoundLength(Entry, (guint32)length16);
1496       return;
1497    }
1498    else
1499    {
1500       // Either implicit VR or a non DICOM conformal (see not below) explicit
1501       // VR that ommited the VR of (at least) this element. Farts happen.
1502       // [Note: according to the part 5, PS 3.5-2001, section 7.1 p25
1503       // on Data elements "Implicit and Explicit VR Data Elements shall
1504       // not coexist in a Data Set and Data Sets nested within it".]
1505       // Length is on 4 bytes.
1506       FixHeaderEntryFoundLength(Entry, ReadInt32());
1507       return;
1508    }
1509 }
1510
1511 /**
1512  * \ingroup   gdcmParser
1513  * \brief     Find the Value Representation of the current Dicom Element.
1514  * @param     Entry
1515  */
1516 void gdcmParser::FindHeaderEntryVR( gdcmHeaderEntry *Entry)
1517 {
1518    if (filetype != ExplicitVR)
1519       return;
1520
1521    char VR[3];
1522    int lgrLue;
1523
1524    long PositionOnEntry = ftell(fp);
1525    // Warning: we believe this is explicit VR (Value Representation) because
1526    // we used a heuristic that found "UL" in the first tag. Alas this
1527    // doesn't guarantee that all the tags will be in explicit VR. In some
1528    // cases (see e-film filtered files) one finds implicit VR tags mixed
1529    // within an explicit VR file. Hence we make sure the present tag
1530    // is in explicit VR and try to fix things if it happens not to be
1531    // the case.
1532
1533    lgrLue=fread (&VR, (size_t)2,(size_t)1, fp);
1534    VR[2]=0;
1535    if(!CheckHeaderEntryVR(Entry,VR))
1536    {
1537       fseek(fp, PositionOnEntry, SEEK_SET);
1538       // When this element is known in the dictionary we shall use, e.g. for
1539       // the semantics (see the usage of IsAnInteger), the VR proposed by the
1540       // dictionary entry. Still we have to flag the element as implicit since
1541       // we know now our assumption on expliciteness is not furfilled.
1542       // avoid  .
1543       if ( Entry->IsVRUnknown() )
1544          Entry->SetVR("Implicit");
1545       Entry->SetImplicitVR();
1546    }
1547 }
1548
1549 /**
1550  * \ingroup   gdcmParser
1551  * \brief     Check the correspondance between the VR of the header entry
1552  *            and the taken VR. If they are different, the header entry is
1553  *            updated with the new VR.
1554  * @param     Entry
1555  * @param     VR
1556  * @return    false if the VR is incorrect of if the VR isn't referenced
1557  *            otherwise, it returns true
1558 */
1559 bool gdcmParser::CheckHeaderEntryVR(gdcmHeaderEntry *Entry, VRKey vr)
1560 {
1561    char msg[100]; // for sprintf
1562    bool RealExplicit = true;
1563
1564    // Assume we are reading a falsely explicit VR file i.e. we reached
1565    // a tag where we expect reading a VR but are in fact we read the
1566    // first to bytes of the length. Then we will interogate (through find)
1567    // the dicom_vr dictionary with oddities like "\004\0" which crashes
1568    // both GCC and VC++ implementations of the STL map. Hence when the
1569    // expected VR read happens to be non-ascii characters we consider
1570    // we hit falsely explicit VR tag.
1571
1572    if ( (!isalpha(vr[0])) && (!isalpha(vr[1])) )
1573       RealExplicit = false;
1574
1575    // CLEANME searching the dicom_vr at each occurence is expensive.
1576    // PostPone this test in an optional integrity check at the end
1577    // of parsing or only in debug mode.
1578    if ( RealExplicit && !gdcmGlobal::GetVR()->Count(vr) )
1579       RealExplicit= false;
1580
1581    if ( !RealExplicit )
1582    {
1583       // We thought this was explicit VR, but we end up with an
1584       // implicit VR tag. Let's backtrack.
1585       sprintf(msg,"Falsely explicit vr file (%04x,%04x)\n",
1586                    Entry->GetGroup(),Entry->GetElement());
1587       dbg.Verbose(1, "gdcmParser::FindVR: ",msg);
1588
1589       return(false);
1590    }
1591
1592    if ( Entry->IsVRUnknown() )
1593    {
1594       // When not a dictionary entry, we can safely overwrite the VR.
1595       Entry->SetVR(vr);
1596    }
1597    else if ( Entry->GetVR() != vr )
1598    {
1599       // The VR present in the file and the dictionary disagree. We assume
1600       // the file writer knew best and use the VR of the file. Since it would
1601       // be unwise to overwrite the VR of a dictionary (since it would
1602       // compromise it's next user), we need to clone the actual DictEntry
1603       // and change the VR for the read one.
1604       gdcmDictEntry* NewEntry = NewVirtualDictEntry(
1605                                  Entry->GetGroup(),Entry->GetElement(),
1606                                  vr,"FIXME",Entry->GetName());
1607       Entry->SetDictEntry(NewEntry);
1608    }
1609    return(true);
1610 }
1611
1612 /**
1613  * \ingroup gdcmParser
1614  * \brief   Get the transformed value of the header entry. The VR value
1615  *          is used to define the transformation to operate on the value
1616  * \warning NOT end user intended method !
1617  * @param   Entry
1618  * @return  Transformed entry value
1619  */
1620 std::string gdcmParser::GetHeaderEntryValue(gdcmHeaderEntry *Entry)
1621 {
1622    if ( (IsHeaderEntryAnInteger(Entry)) && (Entry->IsImplicitVR()) )
1623    {
1624       std::string val=Entry->GetValue();
1625       std::string vr=Entry->GetVR();
1626       guint32 length = Entry->GetLength();
1627       std::ostringstream s;
1628       int nbInt;
1629
1630       if (vr == "US" || vr == "SS")
1631       {
1632          guint16 NewInt16;
1633
1634          nbInt = length / 2;
1635          for (int i=0; i < nbInt; i++)
1636          {
1637             if(i!=0)
1638                s << '\\';
1639             NewInt16 = (val[2*i+0]&0xFF)+((val[2*i+1]&0xFF)<<8);
1640             NewInt16 = SwapShort(NewInt16);
1641             s << NewInt16;
1642          }
1643       }
1644
1645       else if (vr == "UL" || vr == "SL")
1646       {
1647          guint32 NewInt32;
1648
1649          nbInt = length / 4;
1650          for (int i=0; i < nbInt; i++)
1651          {
1652             if(i!=0)
1653                s << '\\';
1654             NewInt32= (val[4*i+0]&0xFF)+((val[4*i+1]&0xFF)<<8)+
1655                      ((val[4*i+2]&0xFF)<<16)+((val[4*i+3]&0xFF)<<24);
1656             NewInt32=SwapLong(NewInt32);
1657             s << NewInt32;
1658          }
1659       }
1660
1661 #ifdef GDCM_NO_ANSI_STRING_STREAM
1662       s << std::ends; // to avoid oddities on Solaris
1663 #endif //GDCM_NO_ANSI_STRING_STREAM
1664       return(s.str());
1665    }
1666
1667    return(Entry->GetValue());
1668 }
1669
1670 /**
1671  * \ingroup gdcmParser
1672  * \brief   Get the reverse transformed value of the header entry. The VR
1673  *          value is used to define the reverse transformation to operate on
1674  *          the value
1675  * \warning NOT end user intended method !
1676  * @param   Entry
1677  * @return  Reverse transformed entry value
1678  */
1679 std::string gdcmParser::GetHeaderEntryUnvalue(gdcmHeaderEntry *Entry)
1680 {
1681    if ( (IsHeaderEntryAnInteger(Entry)) && (Entry->IsImplicitVR()) )
1682    {
1683       std::string vr=Entry->GetVR();
1684       std::ostringstream s;
1685       std::vector<std::string> tokens;
1686
1687       if (vr == "US" || vr == "SS")
1688       {
1689          guint16 NewInt16;
1690
1691          tokens.erase(tokens.begin(),tokens.end()); // clean any previous value
1692          Tokenize (Entry->GetValue(), tokens, "\\");
1693          for (unsigned int i=0; i<tokens.size();i++)
1694          {
1695             NewInt16 = atoi(tokens[i].c_str());
1696             s<<(NewInt16&0xFF)<<((NewInt16>>8)&0xFF);
1697          }
1698          tokens.clear();
1699       }
1700       if (vr == "UL" || vr == "SL")
1701       {
1702          guint32 NewInt32;
1703
1704          tokens.erase(tokens.begin(),tokens.end()); // clean any previous value
1705          Tokenize (Entry->GetValue(), tokens, "\\");
1706          for (unsigned int i=0; i<tokens.size();i++)
1707          {
1708             NewInt32 = atoi(tokens[i].c_str());
1709             s<<(char)(NewInt32&0xFF)<<(char)((NewInt32>>8)&0xFF)
1710                <<(char)((NewInt32>>16)&0xFF)<<(char)((NewInt32>>24)&0xFF);
1711          }
1712          tokens.clear();
1713       }
1714
1715 #ifdef GDCM_NO_ANSI_STRING_STREAM
1716       s << std::ends; // to avoid oddities on Solaris
1717 #endif //GDCM_NO_ANSI_STRING_STREAM
1718       return(s.str());
1719    }
1720
1721    return(Entry->GetValue());
1722 }
1723
1724 /**
1725  * \ingroup gdcmParser
1726  * \brief   Skip a given Header Entry
1727  * \warning NOT end user intended method !
1728  * @param   entry
1729  */
1730 void gdcmParser::SkipHeaderEntry(gdcmHeaderEntry *entry)
1731 {
1732     SkipBytes(entry->GetLength());
1733 }
1734
1735 /**
1736  * \ingroup gdcmParser
1737  * \brief   When the length of an element value is obviously wrong (because
1738  *          the parser went Jabberwocky) one can hope improving things by
1739  *          applying this heuristic.
1740  */
1741 void gdcmParser::FixHeaderEntryFoundLength(gdcmHeaderEntry *Entry, guint32 FoundLength)
1742 {
1743    Entry->SetReadLength(FoundLength); // will be updated only if a bug is found
1744
1745    if ( FoundLength == 0xffffffff) {
1746       FoundLength = 0;
1747    }
1748
1749    guint16 gr =Entry->GetGroup();
1750    guint16 el =Entry->GetElement();
1751
1752    if (FoundLength%2) {
1753       std::cout << "Warning : Tag with uneven length " << FoundLength
1754          <<  "in x(" << std::hex << gr << "," << el <<")" << std::endl;
1755    }
1756
1757    // Sorry for the patch!
1758    // XMedCom did the trick to read some nasty GE images ...
1759    if (FoundLength == 13) {
1760       // The following 'if' will be removed when there is no more
1761       // images on Creatis HDs with a 13 length for Manufacturer...
1762       if ( (Entry->GetGroup() != 0x0008) ||
1763            ( (Entry->GetElement() != 0x0070) && (Entry->GetElement() != 0x0080) ) ){
1764       // end of remove area
1765          FoundLength =10;
1766          Entry->SetReadLength(10); // a bug is to be fixed
1767       }
1768    }
1769
1770    // to fix some garbage 'Leonardo' Siemens images
1771    // May be commented out to avoid overhead
1772    else if ( (Entry->GetGroup() == 0x0009) &&
1773        ( (Entry->GetElement() == 0x1113) || (Entry->GetElement() == 0x1114) ) ){
1774       FoundLength =4;
1775       Entry->SetReadLength(4); // a bug is to be fixed
1776    }
1777    // end of fix
1778
1779    // to try to 'go inside' SeQuences (with length), and not to skip them
1780    else if ( Entry->GetVR() == "SQ")
1781    {
1782       if (enableSequences)    // only if the user does want to !
1783          FoundLength =0;      // ReadLength is unchanged
1784    }
1785
1786    // a SeQuence Element is beginning
1787    // Let's forget it's length
1788    // (we want to 'go inside')
1789
1790    // Pb : *normaly*  fffe|e000 is just a marker, its length *should be* zero
1791    // in gdcm-MR-PHILIPS-16-Multi-Seq.dcm we find lengthes as big as 28800
1792    // if we set the length to zero IsHeaderEntryAnInteger() breaks...
1793    // if we don't, we lost 28800 characters from the Header :-(
1794
1795    else if(Entry->GetGroup() == 0xfffe)
1796    {
1797                        // sometimes, length seems to be wrong
1798       FoundLength =0;  // some more clever checking to be done !
1799                        // I give up!
1800                        // only  gdcm-MR-PHILIPS-16-Multi-Seq.dcm
1801                        // causes troubles :-(
1802    }
1803
1804    Entry->SetUsableLength(FoundLength);
1805 }
1806
1807 /**
1808  * \ingroup gdcmParser
1809  * \brief   Apply some heuristics to predict wether the considered
1810  *          element value contains/represents an integer or not.
1811  * @param   Entry The element value on which to apply the predicate.
1812  * @return  The result of the heuristical predicate.
1813  */
1814 bool gdcmParser::IsHeaderEntryAnInteger(gdcmHeaderEntry *Entry) {
1815    guint16 element = Entry->GetElement();
1816    guint16 group   = Entry->GetGroup();
1817    std::string  vr = Entry->GetVR();
1818    guint32 length  = Entry->GetLength();
1819    // When we have some semantics on the element we just read, and if we
1820    // a priori know we are dealing with an integer, then we shall be
1821    // able to swap it's element value properly.
1822    if ( element == 0 )  // This is the group length of the group
1823    {
1824       if (length == 4)
1825          return true;
1826       else
1827       {
1828          std::ostringstream s;
1829          int filePosition = ftell(fp);
1830          s << "Erroneous Group Length element length  on : (" \
1831            << std::hex << group << " , " << element
1832            << ") -before- position x(" << filePosition << ")"
1833            << "lgt : " << length;
1834         // These 2 lines commented out : a *very dirty* patch
1835         // to go on PrintHeader'ing gdcm-MR-PHILIPS-16-Multi-Seq.dcm.
1836         // have a glance at offset  x(8336) ...
1837         // For *regular* headers, the test is useless..
1838         // lets's print a warning message and go on,
1839         // instead of giving up with an error message
1840
1841         //std::cout << s.str().c_str() << std::endl;
1842
1843         // dbg.Error("gdcmParser::IsHeaderEntryAnInteger",
1844         //    s.str().c_str());
1845       }
1846    }
1847    if ( (vr == "UL") || (vr == "US") || (vr == "SL") || (vr == "SS") )
1848       return true;
1849
1850    return false;
1851 }
1852
1853 /**
1854  * \ingroup gdcmParser
1855  * \brief
1856  *
1857  * @return
1858  */
1859  guint32 gdcmParser::FindHeaderEntryLengthOB(void)  {
1860    // See PS 3.5-2001, section A.4 p. 49 on encapsulation of encoded pixel data.
1861    guint16 g;
1862    guint16 n;
1863    long PositionOnEntry = ftell(fp);
1864    bool FoundSequenceDelimiter = false;
1865    guint32 TotalLength = 0;
1866    guint32 ItemLength;
1867
1868    while ( ! FoundSequenceDelimiter)
1869    {
1870       g = ReadInt16();
1871       n = ReadInt16();
1872       if (errno == 1)
1873          return 0;
1874       TotalLength += 4;  // We even have to decount the group and element
1875
1876       if ( g != 0xfffe && g!=0xb00c ) /*for bogus header */
1877       {
1878          char msg[100]; // for sprintf. Sorry
1879          sprintf(msg,"wrong group (%04x) for an item sequence (%04x,%04x)\n",g, g,n);
1880          dbg.Verbose(1, "gdcmParser::FindLengthOB: ",msg);
1881          errno = 1;
1882          return 0;
1883       }
1884       if ( n == 0xe0dd || ( g==0xb00c && n==0x0eb6 ) ) /* for bogus header  */
1885          FoundSequenceDelimiter = true;
1886       else if ( n != 0xe000 )
1887       {
1888          char msg[100];  // for sprintf. Sorry
1889          sprintf(msg,"wrong element (%04x) for an item sequence (%04x,%04x)\n",
1890                       n, g,n);
1891          dbg.Verbose(1, "gdcmParser::FindLengthOB: ",msg);
1892          errno = 1;
1893          return 0;
1894       }
1895       ItemLength = ReadInt32();
1896       TotalLength += ItemLength + 4;  // We add 4 bytes since we just read
1897                                       // the ItemLength with ReadInt32
1898       SkipBytes(ItemLength);
1899    }
1900    fseek(fp, PositionOnEntry, SEEK_SET);
1901    return TotalLength;
1902 }
1903
1904 /**
1905  * \ingroup gdcmParser
1906  * \brief Reads a supposed to be 16 Bits integer
1907  * \     (swaps it depending on processor endianity)
1908  *
1909  * @return read value
1910  */
1911 guint16 gdcmParser::ReadInt16(void) {
1912    guint16 g;
1913    size_t item_read;
1914    item_read = fread (&g, (size_t)2,(size_t)1, fp);
1915    if ( item_read != 1 ) {
1916       if(ferror(fp))
1917          dbg.Verbose(0, "gdcmParser::ReadInt16", " File Error");
1918       errno = 1;
1919       return 0;
1920    }
1921    errno = 0;
1922    g = SwapShort(g);
1923    return g;
1924 }
1925
1926 /**
1927  * \ingroup gdcmParser
1928  * \brief  Reads a supposed to be 32 Bits integer
1929  * \       (swaps it depending on processor endianity)
1930  *
1931  * @return read value
1932  */
1933 guint32 gdcmParser::ReadInt32(void) {
1934    guint32 g;
1935    size_t item_read;
1936    item_read = fread (&g, (size_t)4,(size_t)1, fp);
1937    if ( item_read != 1 ) {
1938      if(ferror(fp))
1939          dbg.Verbose(0, "gdcmParser::ReadInt32", " File Error");
1940       errno = 1;
1941       return 0;
1942    }
1943    errno = 0;
1944    g = SwapLong(g);
1945    return g;
1946 }
1947
1948 /**
1949  * \ingroup gdcmParser
1950  * \brief
1951  *
1952  * @return
1953  */
1954 void gdcmParser::SkipBytes(guint32 NBytes) {
1955    //FIXME don't dump the returned value
1956    (void)fseek(fp, (long)NBytes, SEEK_CUR);
1957 }
1958
1959 /**
1960  * \ingroup gdcmParser
1961  * \brief
1962  */
1963 void gdcmParser::Initialise(void)
1964 {
1965    RefPubDict = gdcmGlobal::GetDicts()->GetDefaultPubDict();
1966    RefShaDict = (gdcmDict*)0;
1967 }
1968
1969 /**
1970  * \ingroup gdcmParser
1971  * \brief   Discover what the swap code is (among little endian, big endian,
1972  *          bad little endian, bad big endian).
1973  *          sw is set
1974  * @return false when we are absolutely sure
1975  *               it's neither ACR-NEMA nor DICOM
1976  *         true  when we hope ours assuptions are OK
1977  */
1978 bool gdcmParser::CheckSwap() {
1979
1980    // The only guaranted way of finding the swap code is to find a
1981    // group tag since we know it's length has to be of four bytes i.e.
1982    // 0x00000004. Finding the swap code in then straigthforward. Trouble
1983    // occurs when we can't find such group...
1984
1985    guint32  x=4;  // x : for ntohs
1986    bool net2host; // true when HostByteOrder is the same as NetworkByteOrder
1987    guint32  s32;
1988    guint16  s16;
1989
1990    int lgrLue;
1991    char *entCur;
1992    char deb[HEADER_LENGTH_TO_READ];
1993
1994    // First, compare HostByteOrder and NetworkByteOrder in order to
1995    // determine if we shall need to swap bytes (i.e. the Endian type).
1996    if (x==ntohs(x))
1997       net2host = true;
1998    else
1999       net2host = false;
2000
2001    // The easiest case is the one of a DICOM header, since it possesses a
2002    // file preamble where it suffice to look for the string "DICM".
2003    lgrLue = fread(deb, 1, HEADER_LENGTH_TO_READ, fp);
2004
2005    entCur = deb + 128;
2006    if(memcmp(entCur, "DICM", (size_t)4) == 0) {
2007       dbg.Verbose(1, "gdcmParser::CheckSwap:", "looks like DICOM Version3");
2008
2009       // Next, determine the value representation (VR). Let's skip to the
2010       // first element (0002, 0000) and check there if we find "UL"
2011       // - or "OB" if the 1st one is (0002,0001) -,
2012       // in which case we (almost) know it is explicit VR.
2013       // WARNING: if it happens to be implicit VR then what we will read
2014       // is the length of the group. If this ascii representation of this
2015       // length happens to be "UL" then we shall believe it is explicit VR.
2016       // FIXME: in order to fix the above warning, we could read the next
2017       // element value (or a couple of elements values) in order to make
2018       // sure we are not commiting a big mistake.
2019       // We need to skip :
2020       // * the 128 bytes of File Preamble (often padded with zeroes),
2021       // * the 4 bytes of "DICM" string,
2022       // * the 4 bytes of the first tag (0002, 0000),or (0002, 0001)
2023       // i.e. a total of  136 bytes.
2024       entCur = deb + 136;
2025       // FIXME
2026       // Use gdcmParser::dicom_vr to test all the possibilities
2027       // instead of just checking for UL, OB and UI !?
2028
2029       // FIXME : FIXME:
2030       // Sometimes (see : gdcmData/icone.dcm) group 0x0002 *is* Explicit VR,
2031       // but elem 0002,0010 (Transfert Syntax) tells us the file is *Implicit* VR.
2032       // -and it is !-
2033
2034       // The following test is *absolutely useless*, since everything *goes right*
2035       // with a *100 % wrong* assumption !!!
2036
2037       if( (memcmp(entCur, "UL", (size_t)2) == 0) ||
2038           (memcmp(entCur, "OB", (size_t)2) == 0) ||
2039           (memcmp(entCur, "UI", (size_t)2) == 0) ||
2040           (memcmp(entCur, "CS", (size_t)2) == 0) )  // CS, to remove later
2041                                                     // when Write DCM *adds*
2042                                                     // group 0000
2043       {
2044          filetype = ExplicitVR;
2045          dbg.Verbose(1, "gdcmParser::CheckSwap:",
2046                      "explicit Value Representation");
2047       }
2048       else
2049       {
2050          filetype = ImplicitVR;
2051          dbg.Verbose(1, "gdcmParser::CheckSwap:",
2052                      "not an explicit Value Representation");
2053       }
2054
2055       if (net2host)
2056       {
2057          sw = 4321;
2058          dbg.Verbose(1, "gdcmParser::CheckSwap:",
2059                         "HostByteOrder != NetworkByteOrder");
2060       }
2061       else
2062       {
2063          sw = 0;
2064          dbg.Verbose(1, "gdcmParser::CheckSwap:",
2065                         "HostByteOrder = NetworkByteOrder");
2066       }
2067
2068       // Position the file position indicator at first tag (i.e.
2069       // after the file preamble and the "DICM" string).
2070       rewind(fp);
2071       fseek (fp, 132L, SEEK_SET);
2072       return true;
2073    } // End of DicomV3
2074
2075    // Alas, this is not a DicomV3 file and whatever happens there is no file
2076    // preamble. We can reset the file position indicator to where the data
2077    // is (i.e. the beginning of the file).
2078    dbg.Verbose(1, "gdcmParser::CheckSwap:", "not a DICOM Version3 file");
2079    rewind(fp);
2080
2081    // Our next best chance would be to be considering a 'clean' ACR/NEMA file.
2082    // By clean we mean that the length of the first tag is written down.
2083    // If this is the case and since the length of the first group HAS to be
2084    // four (bytes), then determining the proper swap code is straightforward.
2085
2086    entCur = deb + 4;
2087    // We assume the array of char we are considering contains the binary
2088    // representation of a 32 bits integer. Hence the following dirty
2089    // trick :
2090    s32 = *((guint32 *)(entCur));
2091
2092    switch (s32) {
2093       case 0x00040000 :
2094          sw = 3412;
2095          filetype = ACR;
2096          return true;
2097       case 0x04000000 :
2098          sw = 4321;
2099          filetype = ACR;
2100          return true;
2101       case 0x00000400 :
2102          sw = 2143;
2103          filetype = ACR;
2104          return true;
2105       case 0x00000004 :
2106          sw = 0;
2107          filetype = ACR;
2108          return true;
2109       default :
2110
2111       // We are out of luck. It is not a DicomV3 nor a 'clean' ACR/NEMA file.
2112       // It is time for despaired wild guesses.
2113       // So, let's check if this file wouldn't happen to be 'dirty' ACR/NEMA,
2114       //  i.e. the 'group length' element is not present :
2115
2116       //  check the supposed to be 'group number'
2117       //  0x0002 or 0x0004 or 0x0008
2118       //  to determine ' sw' value .
2119       //  Only 0 or 4321 will be possible
2120       //  (no oportunity to check for the formerly well known
2121       //  ACR-NEMA 'Bad Big Endian' or 'Bad Little Endian'
2122       //  if unsuccessfull (i.e. neither 0x0002 nor 0x0200 etc -4, 8-)
2123       //  the file IS NOT ACR-NEMA nor DICOM V3
2124       //  Find a trick to tell it the caller...
2125
2126       s16 = *((guint16 *)(deb));
2127
2128       switch (s16) {
2129       case 0x0002 :
2130       case 0x0004 :
2131       case 0x0008 :
2132          sw = 0;
2133          filetype = ACR;
2134          return true;
2135       case 0x0200 :
2136       case 0x0400 :
2137       case 0x0800 :
2138          sw = 4321;
2139          filetype = ACR;
2140          return true;
2141       default :
2142          dbg.Verbose(0, "gdcmParser::CheckSwap:",
2143                      "ACR/NEMA unfound swap info (Really hopeless !)");
2144          filetype = Unknown;
2145          return false;
2146       }
2147
2148       // Then the only info we have is the net2host one.
2149          //if (! net2host )
2150          //   sw = 0;
2151          //else
2152          //  sw = 4321;
2153          //return;
2154    }
2155 }
2156
2157 /**
2158  * \ingroup gdcmParser
2159  * \brief
2160  */
2161 void gdcmParser::SwitchSwapToBigEndian(void)
2162 {
2163    dbg.Verbose(1, "gdcmParser::SwitchSwapToBigEndian",
2164                   "Switching to BigEndian mode.");
2165    if ( sw == 0    )
2166    {
2167       sw = 4321;
2168       return;
2169    }
2170    if ( sw == 4321 )
2171    {
2172       sw = 0;
2173       return;
2174    }
2175    if ( sw == 3412 )
2176    {
2177       sw = 2143;
2178       return;
2179    }
2180    if ( sw == 2143 )
2181       sw = 3412;
2182 }
2183
2184 /**
2185  * \ingroup gdcmParser
2186  * \brief
2187  * @param NewSize
2188  */
2189 void gdcmParser::SetMaxSizeLoadEntry(long NewSize)
2190 {
2191    if (NewSize < 0)
2192       return;
2193    if ((guint32)NewSize >= (guint32)0xffffffff)
2194    {
2195       MaxSizeLoadEntry = 0xffffffff;
2196       return;
2197    }
2198    MaxSizeLoadEntry = NewSize;
2199 }
2200
2201
2202 /**
2203  * \ingroup gdcmParser
2204  * \brief
2205  * \warning TODO : not yet usable
2206  *          (see MAX_SIZE_PRINT_ELEMENT_VALUE
2207  *           in gdcmHeaderEntry gdcmLoadEntry)
2208  *
2209  * @param NewSize
2210  */
2211 void gdcmParser::SetMaxSizePrintEntry(long NewSize)
2212 {
2213    if (NewSize < 0)
2214       return;
2215    if ((guint32)NewSize >= (guint32)0xffffffff)
2216    {
2217       MaxSizePrintEntry = 0xffffffff;
2218       return;
2219    }
2220    MaxSizePrintEntry = NewSize;
2221 }
2222
2223 /**
2224  * \ingroup gdcmParser
2225  * \brief   Searches both the public and the shadow dictionary (when they
2226  *          exist) for the presence of the DictEntry with given name.
2227  *          The public dictionary has precedence on the shadow one.
2228  * @param   Name name of the searched DictEntry
2229  * @return  Corresponding DictEntry when it exists, NULL otherwise.
2230  */
2231 gdcmDictEntry *gdcmParser::GetDictEntryByName(std::string Name)
2232 {
2233    gdcmDictEntry *found = (gdcmDictEntry *)0;
2234    if (!RefPubDict && !RefShaDict)
2235    {
2236       dbg.Verbose(0, "gdcmParser::GetDictEntry",
2237                      "we SHOULD have a default dictionary");
2238    }
2239    if (RefPubDict)
2240    {
2241       found = RefPubDict->GetDictEntryByName(Name);
2242       if (found)
2243          return found;
2244    }
2245    if (RefShaDict)
2246    {
2247       found = RefShaDict->GetDictEntryByName(Name);
2248       if (found)
2249          return found;
2250    }
2251    return found;
2252 }
2253
2254 /**
2255  * \ingroup gdcmParser
2256  * \brief   Searches both the public and the shadow dictionary (when they
2257  *          exist) for the presence of the DictEntry with given
2258  *          group and element. The public dictionary has precedence on the
2259  *          shadow one.
2260  * @param   group   group of the searched DictEntry
2261  * @param   element element of the searched DictEntry
2262  * @return  Corresponding DictEntry when it exists, NULL otherwise.
2263  */
2264 gdcmDictEntry *gdcmParser::GetDictEntryByNumber(guint16 group,guint16 element)
2265 {
2266    gdcmDictEntry *found = (gdcmDictEntry *)0;
2267    if (!RefPubDict && !RefShaDict)
2268    {
2269       dbg.Verbose(0, "gdcmParser::GetDictEntry",
2270                      "we SHOULD have a default dictionary");
2271    }
2272    if (RefPubDict)
2273    {
2274       found = RefPubDict->GetDictEntryByNumber(group, element);
2275       if (found)
2276          return found;
2277    }
2278    if (RefShaDict)
2279    {
2280       found = RefShaDict->GetDictEntryByNumber(group, element);
2281       if (found)
2282          return found;
2283    }
2284    return found;
2285 }
2286
2287 /**
2288  * \ingroup gdcmParser
2289  * \brief   Read the next tag but WITHOUT loading it's value
2290  * @return  On succes the newly created HeaderEntry, NULL on failure.
2291  */
2292 gdcmHeaderEntry *gdcmParser::ReadNextHeaderEntry(void) {
2293    guint16 g,n;
2294    gdcmHeaderEntry *NewEntry;
2295
2296    g = ReadInt16();
2297    n = ReadInt16();
2298
2299    if (errno == 1)
2300       // We reached the EOF (or an error occured) therefore
2301       // header parsing has to be considered as finished.
2302       return (gdcmHeaderEntry *)0;
2303
2304 /*  Pb : how to propagate the element length (used in SkipHeaderEntry)
2305 //       direct call to SkipBytes ?
2306
2307    if (ignoreShadow == 1 && g%2 ==1)  //JPR
2308       // if user wants to skip shadow groups
2309       // and current element *is* a shadow element
2310       // we don't create anything
2311       return (gdcmHeaderEntry *)1; // to tell caller it's NOT finished
2312 */
2313    NewEntry = NewHeaderEntryByNumber(g, n);
2314    FindHeaderEntryVR(NewEntry);
2315    FindHeaderEntryLength(NewEntry);
2316
2317    if (errno == 1) {
2318       // Call it quits
2319       return NULL;
2320    }
2321    NewEntry->SetOffset(ftell(fp));
2322    return NewEntry;
2323 }
2324
2325 /**
2326  * \ingroup gdcmParser
2327  * \brief   Build a new Element Value from all the low level arguments.
2328  *          Check for existence of dictionary entry, and build
2329  *          a default one when absent.
2330  * @param   Name    Name of the underlying DictEntry
2331  */
2332 gdcmHeaderEntry *gdcmParser::NewHeaderEntryByName(std::string Name)
2333 {
2334    gdcmDictEntry *NewTag = GetDictEntryByName(Name);
2335    if (!NewTag)
2336       NewTag = NewVirtualDictEntry(0xffff, 0xffff, "LO", "Unknown", Name);
2337
2338    gdcmHeaderEntry* NewEntry = new gdcmHeaderEntry(NewTag);
2339    if (!NewEntry)
2340    {
2341       dbg.Verbose(1, "gdcmParser::ObtainHeaderEntryByName",
2342                   "failed to allocate gdcmHeaderEntry");
2343       return (gdcmHeaderEntry *)0;
2344    }
2345    return NewEntry;
2346 }
2347
2348 /**
2349  * \ingroup gdcmParser
2350  * \brief   Request a new virtual dict entry to the dict set
2351  * @param   group  group   of the underlying DictEntry
2352  * @param   elem   element of the underlying DictEntry
2353  * @param   vr     VR of the underlying DictEntry
2354  * @param   fourth owner group
2355  * @param   name   english name
2356  */
2357 gdcmDictEntry *gdcmParser::NewVirtualDictEntry(guint16 group, guint16 element,
2358                                                std::string vr,
2359                                                std::string fourth,
2360                                                std::string name)
2361 {
2362    return gdcmGlobal::GetDicts()->NewVirtualDictEntry(group,element,vr,fourth,name);
2363 }
2364
2365 /**
2366  * \ingroup gdcmParser
2367  * \brief   Build a new Element Value from all the low level arguments.
2368  *          Check for existence of dictionary entry, and build
2369  *          a default one when absent.
2370  * @param   Group group   of the underlying DictEntry
2371  * @param   Elem  element of the underlying DictEntry
2372  */
2373 gdcmHeaderEntry *gdcmParser::NewHeaderEntryByNumber(guint16 Group, guint16 Elem)
2374 {
2375    // Find out if the tag we encountered is in the dictionaries:
2376    gdcmDictEntry *DictEntry = GetDictEntryByNumber(Group, Elem);
2377    if (!DictEntry)
2378       DictEntry = NewVirtualDictEntry(Group, Elem);
2379
2380    gdcmHeaderEntry *NewEntry = new gdcmHeaderEntry(DictEntry);
2381    if (!NewEntry)
2382    {
2383       dbg.Verbose(1, "gdcmParser::NewHeaderEntryByNumber",
2384                   "failed to allocate gdcmHeaderEntry");
2385       return NULL;
2386    }
2387    return NewEntry;
2388 }
2389
2390 // Never used; commented out, waiting for removal.
2391 /**
2392  * \ingroup gdcmParser
2393  * \brief   Small utility function that creates a new manually crafted
2394  *          (as opposed as read from the file) gdcmHeaderEntry with user
2395  *          specified name and adds it to the public tag hash table.
2396  * \note    A fake TagKey is generated so the PubDict can keep it's coherence.
2397  * @param   NewTagName The name to be given to this new tag.
2398  * @param   VR The Value Representation to be given to this new tag.
2399  * @return  The newly hand crafted Element Value.
2400  */
2401 //gdcmHeaderEntry *gdcmParser::NewManualHeaderEntryToPubDict(std::string NewTagName,
2402 //                                                           std::string VR)
2403 //{
2404 //   gdcmHeaderEntry *NewEntry = NULL;
2405 //   guint32 StuffGroup = 0xffff;   // Group to be stuffed with additional info
2406 //   guint32 FreeElem = 0;
2407 //   gdcmDictEntry *DictEntry = NULL;
2408 //
2409 //   FreeElem = GenerateFreeTagKeyInGroup(StuffGroup);
2410 //   if (FreeElem == UINT32_MAX)
2411 //   {
2412 //      dbg.Verbose(1, "gdcmHeader::NewManualHeaderEntryToPubDict",
2413 //                     "Group 0xffff in Public Dict is full");
2414 //      return NULL;
2415 //   }
2416 //
2417 //   DictEntry = NewVirtualDictEntry(StuffGroup, FreeElem,
2418 //                                VR, "GDCM", NewTagName);
2419 //   NewEntry = new gdcmHeaderEntry(DictEntry);
2420 //   AddHeaderEntry(NewEntry);
2421 //   return NewEntry;
2422 //}
2423
2424 /**
2425  * \ingroup gdcmParser
2426  * \brief   Generate a free TagKey i.e. a TagKey that is not present
2427  *          in the TagHt dictionary.
2428  * @param   group The generated tag must belong to this group.
2429  * @return  The element of tag with given group which is fee.
2430  */
2431 guint32 gdcmParser::GenerateFreeTagKeyInGroup(guint16 group)
2432 {
2433    for (guint32 elem = 0; elem < UINT32_MAX; elem++)
2434    {
2435       TagKey key = gdcmDictEntry::TranslateToKey(group, elem);
2436       if (tagHT.count(key) == 0)
2437          return elem;
2438    }
2439    return UINT32_MAX;
2440 }
2441
2442 //-----------------------------------------------------------------------------