1 /*=========================================================================
4 Module: $RCSfile: gdcmDocument.h,v $
6 Date: $Date: 2005/08/29 13:05:01 $
7 Version: $Revision: 1.120 $
9 Copyright (c) CREATIS (Centre de Recherche et d'Applications en Traitement de
10 l'Image). All rights reserved. See Doc/License.txt or
11 http://www.creatis.insa-lyon.fr/Public/Gdcm/License.html for details.
13 This software is distributed WITHOUT ANY WARRANTY; without even
14 the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 PURPOSE. See the above copyright notices for more information.
17 =========================================================================*/
19 #ifndef GDCMDOCUMENT_H
20 #define GDCMDOCUMENT_H
24 #include "gdcmElementSet.h"
25 #include "gdcmException.h"
31 #define NO_SEQ 0x00000001 // Don't load Sequences
32 #define NO_SHADOW 0x00000002 // Don't load odd (Shadow) groups
33 #define NO_SHADOWSEQ 0x00000004 // Don't load Sequences if they belong
35 // to an odd (Shadow) group (*exclusive* from NO_SEQ and NO_SHADOW)
43 //-----------------------------------------------------------------------------
45 * \brief Derived by both gdcm::File and gdcm::DicomDir
47 class GDCM_EXPORT Document : public ElementSet
51 typedef std::list<Element> ListElements;
54 //Deprecated : use SetFileName() + Load()
55 virtual bool Load( std::string const &filename );
61 bool SetShaDict(Dict *dict);
62 bool SetShaDict(DictKey const &dictName);
64 // Information contained in the gdcm::Document
65 virtual bool IsReadable();
68 FileType GetFileType();
69 std::string GetTransferSyntax();
70 /// Return the Transfer Syntax as a string
71 std::string GetTransferSyntaxName();
74 /// \brief Returns the current 'swap code' (see \ref SwapCode )
75 int GetSwapCode() { return this->SwapCode; }
76 // System access (meaning endian related !?)
77 uint16_t SwapShort(uint16_t);
78 uint32_t SwapLong(uint32_t);
79 /// \brief Puts the bytes of a 2-byte integer back in processor order.
80 /// Implemented as a plain call to SwapShort().
81 uint16_t UnswapShort(uint16_t a) { return this->SwapShort(a); }
82 /// \brief Puts the bytes of a 4-byte integer back in processor order.
83 /// Implemented as a plain call to SwapLong().
84 uint32_t UnswapLong(uint32_t a) { return this->SwapLong(a); }
87 /// \brief Read-only access to \ref Filename
88 const std::string &GetFileName() const { return this->Filename; }
89 /// \brief Sets \ref Filename; flags the Document as modified only when the name changes
90 virtual void SetFileName(std::string const &fileName)
91 { if (Filename == fileName) return; // same name : nothing to record
92 Filename = fileName; IsDocumentModified = true; }
94 std::ifstream *OpenFile();
96 void WriteContent( std::ofstream *fp, FileType type );
99 virtual void LoadEntryBinArea(uint16_t group, uint16_t elem);
100 virtual void LoadEntryBinArea(BinEntry *entry);
102 void LoadDocEntrySafe(DocEntry *entry);
103 void AddForceLoadElement(uint16_t group, uint16_t elem);
105 // Ordering of Documents
106 bool operator<(Document &document);
109 * \brief Sets the LoadMode as a boolean string.
110 * NO_SEQ, NO_SHADOW, NO_SHADOWSEQ
111 ... (nothing more, right now)
112 * WARNING : before using NO_SHADOW, be sure *all* your files
113 * contain accurate values in the 0x0000 element (if any)
114 * of *each* Shadow Group. The parser will fail if the size is wrong !
115 * @param mode Load mode to be used
117 void SetLoadMode (int mode) { if (LoadMode != mode)
118 LoadMode=mode, IsDocumentModified = true; }
122 // Constructor and destructor are protected to prevent end users
123 // from instantiating this class Document directly (only gdcm::File
124 // and gdcm::DicomDir are meaningful).
126 Document( std::string const &filename );
129 uint16_t ReadInt16() throw ( FormatError );
130 uint32_t ReadInt32() throw ( FormatError );
131 void SkipBytes(uint32_t);
132 int ComputeGroup0002Length( FileType filetype );
135 /// Name of the underlying file this Document refers to.
136 std::string Filename;
138 /// \brief Swap code gives information on the byte order of what is
139 /// supposed to be an int32, as it is read on disc
140 /// (depending on the image Transfer Syntax *and* on the processor endianness)
141 /// as opposed to the order it should have in memory to be dealt with as an int32.
143 /// - a 'Little Endian' image, read with a little endian processor
144 /// will have a SwapCode= 1234 (the order is OK; nothing to do)
145 /// - a 'Little Endian' image, read with a big endian processor
146 /// will have a SwapCode= 4321 (the order is wrong; int32 and int16 must be swapped)
148 /// note : values 2143, 4321, 3412 remain for the ACR-NEMA time, and
149 /// the well known 'Bad Big Endian' and 'Bad Little Endian' codes
152 ///\brief whether we already parsed group 0002 (Meta Elements)
153 bool Group0002Parsed;
155 ///\brief whether file has a DCM Preamble
158 /// File Pointer, opened during Document parsing.
161 /// ACR, ACR_LIBIDO, ExplicitVR, ImplicitVR, Unknown
164 /// After opening the file, we read HEADER_LENGTH_TO_READ bytes.
165 static const unsigned int HEADER_LENGTH_TO_READ;
166 /// \brief Elements whose value is longer than MAX_SIZE_LOAD_ELEMENT_VALUE are NOT loaded
168 static const unsigned int MAX_SIZE_LOAD_ELEMENT_VALUE;
170 /// User supplied list of elements to Anonymize
171 ListElements UserAnonymizeList;
173 /// User supplied list of elements to force Load
174 ListElements UserForceLoadList;
176 /// \brief Bit string integer (each one considered as a boolean)
177 /// Bit 0 : Skip Sequences, if possible
178 /// Bit 1 : Skip Shadow Groups if possible
179 /// Probably, some more to add
182 /// \brief Whether the gdcm::Document is already parsed/loaded :
183 /// False from the creation of the gdcm::Document until
184 /// gdcm::Document::Load()
185 bool IsDocumentAlreadyLoaded; // FIXME : probably useless now
187 /// Whether the gdcm::Document was modified since the last Load()
188 bool IsDocumentModified;
193 bool DoTheLoadingDocumentJob();
195 void ParseDES(DocEntrySet *set, long offset, long l_max, bool delim_mode);
196 void ParseSQ (SeqEntry *seq, long offset, long l_max, bool delim_mode);
198 void LoadDocEntry (DocEntry *e, bool forceLoad = false);
199 void FindDocEntryLength (DocEntry *e) throw ( FormatError );
200 uint32_t FindDocEntryLengthOBOrOW() throw( FormatUnexpected );
201 std::string FindDocEntryVR();
202 bool CheckDocEntryVR (VRKey k);
204 std::string GetDocEntryValue (DocEntry *entry);
205 std::string GetDocEntryUnvalue(DocEntry *entry);
207 void SkipDocEntry (DocEntry *entry);
208 void SkipToNextDocEntry (DocEntry *entry);
210 void FixDocEntryFoundLength(DocEntry *entry, uint32_t l);
211 bool IsDocEntryAnInteger (DocEntry *entry);
214 void SwitchByteSwapCode();
215 void SetMaxSizeLoadEntry(long);
217 // DocEntry related utilities
218 DocEntry *ReadNextDocEntry();
220 void HandleBrokenEndian (uint16_t &group, uint16_t &elem);
221 void HandleOutOfGroup0002(uint16_t &group, uint16_t &elem);
222 DocEntry *Backtrack(DocEntry *docEntry);
225 /// Public dictionary used to parse this header
227 /// \brief Optional "shadow dictionary" (private elements) used to parse
231 /// \brief Size threshold above which an element value will NOT be loaded
232 /// in memory (to avoid loading the image/volume itself). By default,
233 /// this upper bound is fixed to 1024 bytes (which might look reasonable
234 /// when one considers the definition of the various VR contents).
235 uint32_t MaxSizeLoadEntry;
237 // uint32_t GenerateFreeTagKeyInGroup(uint16_t group);
238 // void BuildFlatHashTableRecurse( TagDocEntryHT &builtHT,
239 // DocEntrySet *set );
243 } // end namespace gdcm
245 //-----------------------------------------------------------------------------