001/*
002 * #%L
003 * HAPI FHIR - Core Library
004 * %%
005 * Copyright (C) 2014 - 2025 Smile CDR, Inc.
006 * %%
007 * Licensed under the Apache License, Version 2.0 (the "License");
008 * you may not use this file except in compliance with the License.
009 * You may obtain a copy of the License at
010 *
011 * http://www.apache.org/licenses/LICENSE-2.0
012 *
013 * Unless required by applicable law or agreed to in writing, software
014 * distributed under the License is distributed on an "AS IS" BASIS,
015 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
016 * See the License for the specific language governing permissions and
017 * limitations under the License.
018 * #L%
019 */
020package ca.uhn.fhir.parser;
021
022import ca.uhn.fhir.context.ConfigurationException;
023import ca.uhn.fhir.context.FhirContext;
024import ca.uhn.fhir.context.ParserOptions;
025import ca.uhn.fhir.model.api.IResource;
026import ca.uhn.fhir.rest.api.EncodingEnum;
027import ca.uhn.fhir.util.CollectionUtil;
028import jakarta.annotation.Nonnull;
029import jakarta.annotation.Nullable;
030import org.hl7.fhir.instance.model.api.IAnyResource;
031import org.hl7.fhir.instance.model.api.IBase;
032import org.hl7.fhir.instance.model.api.IBaseResource;
033import org.hl7.fhir.instance.model.api.IIdType;
034
035import java.io.IOException;
036import java.io.InputStream;
037import java.io.Reader;
038import java.io.Writer;
039import java.util.Collection;
040import java.util.List;
041import java.util.Set;
042
043/**
044 * A parser, which can be used to convert between HAPI FHIR model/structure objects, and their respective String wire
045 * formats, in either XML or JSON.
046 * <p>
047 * Thread safety: <b>Parsers are not guaranteed to be thread safe</b>. Create a new parser instance for every thread or
048 * every message being parsed/encoded.
049 * </p>
050 */
051public interface IParser {
052
053        /**
054         * Encodes a resource using the parser's given encoding format.
055         *
056         * @param theResource The resource to encode. Must not be null.
057         * @return A string representation of the encoding
058         * @throws DataFormatException If any invalid elements within the contents to be encoded prevent successful encoding.
059         */
060        String encodeResourceToString(IBaseResource theResource) throws DataFormatException;
061
062        /**
063         * Encodes a resource using the parser's given encoding format.
064         *
065         * @param theResource The resource to encode. Must not be null.
066         * @param theWriter   The writer to write to.
067         * @throws DataFormatException If any invalid elements within the contents to be encoded prevent successful encoding.
068         */
069        void encodeResourceToWriter(IBaseResource theResource, Writer theWriter) throws IOException, DataFormatException;
070
071        /**
072         * Encodes any FHIR element to a string.
073         * If a {@link IBaseResource resource object} is passed in, the resource will be encoded using standard FHIR
074         * encoding rules. If a {@link org.hl7.fhir.instance.model.api.IPrimitiveType primitive datatype} is passed in,
075         * the string value of the primitive type is encoded. Any extensions on the primitive type are not encoded.
076         * If any other object is passed in, a fragment is encoded. The format of the fragment depends on the encoding:
077         * <ul>
078         *    <li><b>JSON</b>: The fragment is output as a simple JSON object, exactly as it would appear within an encoded resource.</li>
079         *    <li><b>XML</b>: The fragment is output as an XML element as it would appear within an encoded resource, however it is wrapped in an element called <code>&lt;element&gt;</code> in order to avoid producing a document with multiple root tags.</li>
080         *    <li><b>RDF/Turtle</b>: This mode is not supported and will throw an {@link ca.uhn.fhir.rest.server.exceptions.InternalErrorException}</li>
081         * </ul>
082         *
083         * @since 6.8.0
084         */
085        String encodeToString(IBase theElement) throws DataFormatException;
086
087        /**
088         * Encodes any FHIR element to a writer.
089         * If a {@link IBaseResource resource object} is passed in, the resource will be encoded using standard FHIR
090         * encoding rules. If a {@link org.hl7.fhir.instance.model.api.IPrimitiveType primitive datatype} is passed in,
091         * the string value of the primitive type is encoded. Any extensions on the primitive type are not encoded.
092         * If any other object is passed in, a fragment is encoded. The format of the fragment depends on the encoding:
093         * <ul>
094         *    <li><b>JSON</b>: The fragment is output as a simple JSON object, exactly as it would appear within an encoded resource.</li>
095         *    <li><b>XML</b>: The fragment is output as an XML element as it would appear within an encoded resource, however it is wrapped in an element called <code>&lt;element&gt;</code> in order to avoid producing a document with multiple root tags.</li>
096         *    <li><b>RDF/Turtle</b>: This mode is not supported and will throw an {@link ca.uhn.fhir.rest.server.exceptions.InternalErrorException}</li>
097         * </ul>
098         *
099         * @since 6.8.0
100         */
101        void encodeToWriter(IBase theElement, Writer theWriter) throws DataFormatException, IOException;
102
103        /**
104         * If not set to null (as is the default) this ID will be used as the ID in any
105         * resources encoded by this parser
106         */
107        IIdType getEncodeForceResourceId();
108
109        /**
110         * When encoding, force this resource ID to be encoded as the resource ID
111         */
112        @SuppressWarnings("UnusedReturnValue")
113        IParser setEncodeForceResourceId(IIdType theForceResourceId);
114
115        /**
116         * Which encoding does this parser instance produce?
117         */
118        EncodingEnum getEncoding();
119
120        /**
121         * Gets the preferred types, as set using {@link #setPreferTypes(List)}
122         *
123         * @return Returns the preferred types, or <code>null</code>
124         * @see #setPreferTypes(List)
125         */
126        List<Class<? extends IBaseResource>> getPreferTypes();
127
128        /**
129         * If set, when parsing resources the parser will try to use the given types when possible, in
130         * the order that they are provided (from highest to lowest priority). For example, if a custom
131         * type which declares to implement the Patient resource is passed in here, and the
132         * parser is parsing a Bundle containing a Patient resource, the parser will use the given
133         * custom type.
134         * <p>
135         * This feature is related to, but not the same as the
136         * {@link FhirContext#setDefaultTypeForProfile(String, Class)} feature.
137         * <code>setDefaultTypeForProfile</code> is used to specify a type to be used
138         * when a resource explicitly declares support for a given profile. This
139         * feature specifies a type to be used irrespective of the profile declaration
140         * in the metadata statement.
141         * </p>
142         *
143         * @param thePreferTypes The preferred types, or <code>null</code>
144         */
145        void setPreferTypes(List<Class<? extends IBaseResource>> thePreferTypes);
146
147        /**
148         * Returns true if resource IDs should be omitted
149         *
150         * @see #setOmitResourceId(boolean)
151         * @since 1.1
152         */
153        boolean isOmitResourceId();
154
155        /**
156         * If set to <code>true</code> (default is <code>false</code>) the ID of any resources being encoded will not be
157         * included in the output. Note that this does not apply to contained resources, only to root resources. In other
158         * words, if this is set to <code>true</code>, contained resources will still have local IDs but the outer/containing
159         * ID will not have an ID.
160         * <p>
161         * If the resource being encoded is a Bundle or Parameters resource, this setting only applies to the
162         * outer resource being encoded, not any resources contained within.
163         * </p>
164         *
165         * @param theOmitResourceId Should resource IDs be omitted
166         * @return Returns a reference to <code>this</code> parser so that method calls can be chained together
167         * @since 1.1
168         */
169        IParser setOmitResourceId(boolean theOmitResourceId);
170
171        /**
172         * If set to <code>true<code> (which is the default), resource references containing a version
173         * will have the version removed when the resource is encoded. This is generally good behaviour because
174         * in most situations, references from one resource to another should be to the resource by ID, not
175         * by ID and version. In some cases though, it may be desirable to preserve the version in resource
176         * links. In that case, this value should be set to <code>false</code>.
177         *
178         * @return Returns the parser instance's configuration setting for stripping versions from resource references when
179         * encoding. This method will return <code>null</code> if no value is set, in which case
180         * the value from the {@link ParserOptions} will be used (default is <code>true</code>)
181         * @see ParserOptions
182         */
183        Boolean getStripVersionsFromReferences();
184
185        /**
186         * If set to <code>true<code> (which is the default), resource references containing a version
187         * will have the version removed when the resource is encoded. This is generally good behaviour because
188         * in most situations, references from one resource to another should be to the resource by ID, not
189         * by ID and version. In some cases though, it may be desirable to preserve the version in resource
190         * links. In that case, this value should be set to <code>false</code>.
191         * <p>
192         * This method provides the ability to globally disable reference encoding. If finer-grained
193         * control is needed, use {@link #setDontStripVersionsFromReferencesAtPaths(String...)}
194         * </p>
195         *
196         * @param theStripVersionsFromReferences Set this to <code>false<code> to prevent the parser from removing resource versions from references (or <code>null</code> to apply the default setting from the {@link ParserOptions}
197         * @return Returns a reference to <code>this</code> parser so that method calls can be chained together
198         * @see #setDontStripVersionsFromReferencesAtPaths(String...)
199         * @see ParserOptions
200         */
201        IParser setStripVersionsFromReferences(Boolean theStripVersionsFromReferences);
202
203        /**
204         * Is the parser in "summary mode"? See {@link #setSummaryMode(boolean)} for information
205         *
206         * @see #setSummaryMode(boolean) for information
207         */
208        boolean isSummaryMode();
209
210        /**
211         * If set to <code>true</code> (default is <code>false</code>) only elements marked by the FHIR specification as
212         * being "summary elements" will be included.
213         * <p>
214         * It is possible to modify the default summary mode element inclusions
215         * for this parser instance by invoking {@link #setEncodeElements(Set)}
216         * or {@link #setDontEncodeElements(Collection)}. It is also possible to
217         * modify the default summary mode element inclusions for all parsers
218         * generated for a given {@link FhirContext} by accessing
219         * {@link FhirContext#getParserOptions()} followed by
220         * {@link ParserOptions#setEncodeElementsForSummaryMode(Collection)} and/or
221         * {@link ParserOptions#setDontEncodeElementsForSummaryMode(Collection)}.
222         * </p>
223         * <p>
224         * For compatibility reasons with other frameworks, when encoding a
225         * <code>CapabilityStatement</code> resource in summary mode, extensions
226         * are always encoded, even though the FHIR Specification does not consider
227         * them to be summary elements.
228         * </p>
229         *
230         * @return Returns a reference to <code>this</code> parser so that method calls can be chained together
231         */
232        IParser setSummaryMode(boolean theSummaryMode);
233
234        /**
235         * Parses a resource
236         *
237         * @param theResourceType The resource type to use. This can be used to explicitly specify a class which extends a built-in type
238         *                        (e.g. a custom type extending the default Patient class)
239         * @param theReader       The reader to parse input from. Note that the Reader will not be closed by the parser upon completion.
240         * @return A parsed resource
241         * @throws DataFormatException If the resource can not be parsed because the data is not recognized or invalid for any reason
242         */
243        <T extends IBaseResource> T parseResource(Class<T> theResourceType, Reader theReader) throws DataFormatException;
244
245        /**
246         * Parses a resource
247         *
248         * @param theResourceType The resource type to use. This can be used to explicitly specify a class which extends a built-in type
249         *                        (e.g. a custom type extending the default Patient class)
250         * @param theInputStream  The InputStream to parse input from, <b>with an implied charset of UTF-8</b>. Note that the InputStream will not be closed by the parser upon completion.
251         * @return A parsed resource
252         * @throws DataFormatException If the resource can not be parsed because the data is not recognized or invalid for any reason
253         */
254        <T extends IBaseResource> T parseResource(Class<T> theResourceType, InputStream theInputStream)
255                        throws DataFormatException;
256
257        /**
258         * Parses a resource
259         *
260         * @param theResourceType The resource type to use. This can be used to explicitly specify a class which extends a built-in type
261         *                        (e.g. a custom type extending the default Patient class)
262         * @param theString       The string to parse
263         * @return A parsed resource
264         * @throws DataFormatException If the resource can not be parsed because the data is not recognized or invalid for any reason
265         */
266        <T extends IBaseResource> T parseResource(Class<T> theResourceType, String theString) throws DataFormatException;
267
268        /**
269         * Parses a resource
270         *
271         * @param theReader The reader to parse input from. Note that the Reader will not be closed by the parser upon completion.
272         * @return A parsed resource. Note that the returned object will be an instance of {@link IResource} or
273         * {@link IAnyResource} depending on the specific FhirContext which created this parser.
274         * @throws DataFormatException If the resource can not be parsed because the data is not recognized or invalid for any reason
275         */
276        IBaseResource parseResource(Reader theReader) throws ConfigurationException, DataFormatException;
277
278        /**
279         * Parses a resource
280         *
281         * @param theInputStream The InputStream to parse input from (charset is assumed to be UTF-8).
282         *                       Note that the stream will not be closed by the parser upon completion.
283         * @return A parsed resource. Note that the returned object will be an instance of {@link IResource} or
284         * {@link IAnyResource} depending on the specific FhirContext which created this parser.
285         * @throws DataFormatException If the resource can not be parsed because the data is not recognized or invalid for any reason
286         */
287        IBaseResource parseResource(InputStream theInputStream) throws ConfigurationException, DataFormatException;
288
289        /**
290         * Parses a resource
291         *
292         * @param theMessageString The string to parse
293         * @return A parsed resource. Note that the returned object will be an instance of {@link IResource} or
294         * {@link IAnyResource} depending on the specific FhirContext which created this parser.
295         * @throws DataFormatException If the resource can not be parsed because the data is not recognized or invalid for any reason
296         */
297        IBaseResource parseResource(String theMessageString) throws ConfigurationException, DataFormatException;
298
299        /**
300         * If provided, specifies the elements which should NOT be encoded. Valid values for this
301         * field would include:
302         * <ul>
303         * <li><b>Patient</b> - Don't encode patient and all its children</li>
304         * <li><b>Patient.name</b> - Don't encode the patient's name</li>
305         * <li><b>Patient.name.family</b> - Don't encode the patient's family name</li>
306         * <li><b>*.text</b> - Don't encode the text element on any resource (only the very first position may contain a
307         * wildcard)</li>
308         * </ul>
309         * <p>
310         * Note: If {@link #setSummaryMode(boolean)} is set to <code>true</code>, then any
311         * elements specified using this method will be excluded even if they are
312         * summary elements.
313         * </p>
314         * <p>
315         * DSTU2 note: Note that values including meta, such as <code>Patient.meta</code>
316         * will work for DSTU2 parsers, but values with sub-elements on meta such
317         * as <code>Patient.meta.lastUpdated</code> will only work in
318         * DSTU3+ mode.
319         * </p>
320         *
321         * @param theDontEncodeElements The elements to not encode, or <code>null</code>
322         * @see #setEncodeElements(Set)
323         * @see ParserOptions#setDontEncodeElementsForSummaryMode(Collection)
324         */
325        IParser setDontEncodeElements(@Nullable Collection<String> theDontEncodeElements);
326
327        /**
328         * If provided, specifies the elements which should NOT be encoded. Valid values for this
329         * field would include:
330         * <ul>
331         * <li><b>Patient</b> - Don't encode patient and all its children</li>
332         * <li><b>Patient.name</b> - Don't encode the patient's name</li>
333         * <li><b>Patient.name.family</b> - Don't encode the patient's family name</li>
334         * <li><b>*.text</b> - Don't encode the text element on any resource (only the very first position may contain a
335         * wildcard)</li>
336         * </ul>
337         * <p>
338         * DSTU2 note: Note that values including meta, such as <code>Patient.meta</code>
339         * will work for DSTU2 parsers, but values with sub-elements on meta such
340         * as <code>Patient.meta.lastUpdated</code> will only work in
341         * DSTU3+ mode.
342         * </p>
343         *
344         * @param theDontEncodeElements The elements to not encode. Can be an empty list, but must not be <code>null</code>.
345         * @see #setDontEncodeElements(Collection)
346         * @see ParserOptions#setDontEncodeElementsForSummaryMode(Collection)
347         * @since 7.4.0
348         */
349        default IParser setDontEncodeElements(@Nonnull String... theDontEncodeElements) {
350                return setDontEncodeElements(CollectionUtil.newSet(theDontEncodeElements));
351        }
352
353        /**
354         * If provided, specifies the elements which should be encoded, to the exclusion of all others. Valid values for this
355         * field would include:
356         * <ul>
357         * <li><b>Patient</b> - Encode patient and all its children</li>
358         * <li><b>Patient.name</b> - Encode only the patient's name</li>
359         * <li><b>Patient.name.family</b> - Encode only the patient's family name</li>
360         * <li><b>*.text</b> - Encode the text element on any resource (only the very first position may contain a
361         * wildcard)</li>
362         * <li><b>*.(mandatory)</b> - This is a special case which causes any mandatory fields (min > 0) to be encoded</li>
363         * </ul>
364         * <p>
365         * Note: If {@link #setSummaryMode(boolean)} is set to <code>true</code>, then any
366         * elements specified using this method will be included even if they are not
367         * summary elements.
368         * </p>
369         *
370         * @param theEncodeElements The elements to encode, or <code>null</code>
371         * @see #setDontEncodeElements(Collection)
372         * @see #setEncodeElements(String...)
373         * @see ParserOptions#setEncodeElementsForSummaryMode(Collection)
374         */
375        IParser setEncodeElements(@Nullable Set<String> theEncodeElements);
376
377        /**
378         * If provided, specifies the elements which should be encoded, to the exclusion of all others. Valid values for this
379         * field would include:
380         * <ul>
381         * <li><b>Patient</b> - Encode patient and all its children</li>
382         * <li><b>Patient.name</b> - Encode only the patient's name</li>
383         * <li><b>Patient.name.family</b> - Encode only the patient's family name</li>
384         * <li><b>*.text</b> - Encode the text element on any resource (only the very first position may contain a
385         * wildcard)</li>
386         * <li><b>*.(mandatory)</b> - This is a special case which causes any mandatory fields (min > 0) to be encoded</li>
387         * </ul>
388         * <p>
389         * Note: If {@link #setSummaryMode(boolean)} is set to <code>true</code>, then any
390         * elements specified using this method will be included even if they are not
391         * summary elements.
392         * </p>
393         *
394         * @param theEncodeElements The elements to encode. Can be an empty list, but must not be <code>null</code>.
395         * @since 7.4.0
396         * @see #setEncodeElements(Set)
397         * @see ParserOptions#setEncodeElementsForSummaryMode(String...)
398         */
399        default IParser setEncodeElements(@Nonnull String... theEncodeElements) {
400                return setEncodeElements(CollectionUtil.newSet(theEncodeElements));
401        }
402
403        /**
404         * If set to <code>true</code> (default is false), the values supplied
405         * to {@link #setEncodeElements(Set)} will not be applied to the root
406         * resource (typically a Bundle), but will be applied to any sub-resources
407         * contained within it (i.e. search result resources in that bundle)
408         */
409        boolean isEncodeElementsAppliesToChildResourcesOnly();
410
411        /**
412         * If set to <code>true</code> (default is false), the values supplied
413         * to {@link #setEncodeElements(Set)} will not be applied to the root
414         * resource (typically a Bundle), but will be applied to any sub-resources
415         * contained within it (i.e. search result resources in that bundle)
416         */
417        void setEncodeElementsAppliesToChildResourcesOnly(boolean theEncodeElementsAppliesToChildResourcesOnly);
418
419        /**
420         * Registers an error handler which will be invoked when any parse errors are found
421         *
422         * @param theErrorHandler The error handler to set. Must not be null.
423         */
424        IParser setParserErrorHandler(IParserErrorHandler theErrorHandler);
425
426        /**
427         * Sets the "pretty print" flag, meaning that the parser will encode resources with human-readable spacing and
428         * newlines between elements instead of condensing output as much as possible.
429         *
430         * @param thePrettyPrint The flag
431         * @return Returns an instance of <code>this</code> parser so that method calls can be chained together
432         */
433        IParser setPrettyPrint(boolean thePrettyPrint);
434
435        /**
436         * Sets the server's base URL used by this parser. If a value is set, resource references will be turned into
437         * relative references if they are provided as absolute URLs but have a base matching the given base.
438         *
439         * @param theUrl The base URL, e.g. "<a href="http://example.com/base">http://example.com/base</a>"
440         * @return Returns an instance of <code>this</code> parser so that method calls can be chained together
441         */
442        IParser setServerBaseUrl(String theUrl);
443
444        /**
445         * If set to <code>true</code> (which is the default), the Bundle.entry.fullUrl will override the Bundle.entry.resource's
446         * resource id if the fullUrl is defined. This behavior happens when parsing the source data into a Bundle object. Set this
447         * to <code>false</code> if this is not the desired behavior (e.g. the client code wishes to perform additional
448         * validation checks between the fullUrl and the resource id).
449         *
450         * @param theOverrideResourceIdWithBundleEntryFullUrl Set this to <code>false</code> to prevent the parser from overriding resource ids with the
451         *                                                    Bundle.entry.fullUrl (or <code>null</code> to apply the default setting from the {@link ParserOptions})
452         * @return Returns a reference to <code>this</code> parser so that method calls can be chained together
453         * @see ParserOptions
454         */
455        IParser setOverrideResourceIdWithBundleEntryFullUrl(Boolean theOverrideResourceIdWithBundleEntryFullUrl);
456
457        /**
458         * If set to <code>true</code> (default is <code>false</code>), narratives will not be included in the encoded
459         * values.
460         */
461        IParser setSuppressNarratives(boolean theSuppressNarratives);
462
463        /**
464         * Returns the value supplied to {@link IParser#setDontStripVersionsFromReferencesAtPaths(String...)}
465         * or <code>null</code> if no value has been set for this parser (in which case the default from
466         * the {@link ParserOptions} will be used).
467         *
468         * @see #setDontStripVersionsFromReferencesAtPaths(String...)
469         * @see #setStripVersionsFromReferences(Boolean)
470         * @see ParserOptions
471         */
472        Set<String> getDontStripVersionsFromReferencesAtPaths();
473
474        /**
475         * If supplied value(s), any resource references at the specified paths will have their
476         * resource versions encoded instead of being automatically stripped during the encoding
477         * process. This setting has no effect on the parsing process.
478         * <p>
479         * This method provides a finer-grained level of control than {@link #setStripVersionsFromReferences(Boolean)}
480         * and any paths specified by this method will be encoded even if {@link #setStripVersionsFromReferences(Boolean)}
481         * has been set to <code>true</code> (which is the default)
482         * </p>
483         *
484         * @param thePaths A collection of paths for which the resource versions will not be removed automatically
485         *                 when serializing, e.g. "Patient.managingOrganization" or "AuditEvent.object.reference". Note that
486         *                 only resource name and field names with dots separating is allowed here (no repetition
487         *                 indicators, FluentPath expressions, etc.). Set to <code>null</code> to use the value
488         *                 set in the {@link ParserOptions}
489         * @return Returns a reference to <code>this</code> parser so that method calls can be chained together
490         * @see #setStripVersionsFromReferences(Boolean)
491         * @see ParserOptions
492         */
493        IParser setDontStripVersionsFromReferencesAtPaths(String... thePaths);
494
495        /**
496         * If supplied value(s), any resource references at the specified paths will have their
497         * resource versions encoded instead of being automatically stripped during the encoding
498         * process. This setting has no effect on the parsing process.
499         * <p>
500         * This method provides a finer-grained level of control than {@link #setStripVersionsFromReferences(Boolean)}
501         * and any paths specified by this method will be encoded even if {@link #setStripVersionsFromReferences(Boolean)}
502         * has been set to <code>true</code> (which is the default)
503         * </p>
504         *
505         * @param thePaths A collection of paths for which the resource versions will not be removed automatically
506         *                 when serializing, e.g. "Patient.managingOrganization" or "AuditEvent.object.reference". Note that
507         *                 only resource name and field names with dots separating is allowed here (no repetition
508         *                 indicators, FluentPath expressions, etc.). Set to <code>null</code> to use the value
509         *                 set in the {@link ParserOptions}
510         * @return Returns a reference to <code>this</code> parser so that method calls can be chained together
511         * @see #setStripVersionsFromReferences(Boolean)
512         * @see ParserOptions
513         */
514        IParser setDontStripVersionsFromReferencesAtPaths(Collection<String> thePaths);
515}