Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions SIS/clarin/data/formats/fCSV.xml
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,8 @@
<keyword>tabular format</keyword>
<keyword type="SSO">W3C</keyword>
<extId type="LOC">fdd000323</extId>
<extDoc type="enWiki">Comma-separated_values</extDoc>
<extDoc type="formatWiki">CSV</extDoc>
<info type="description">
<p>"CSV is one of the most popular formats for publishing data on the web. It is concise, easy
to understand by both humans and computers, and aligns nicely to the tabular nature of most
Expand Down Expand Up @@ -38,6 +40,7 @@
<li><a href="https://specs.frictionlessdata.io/csv-dialect/">CSV Dialect</a> -- a set of modelling parameters for describing various dialects of CSV</li>
</ul>
</info>
<relation target="tabularDataSpec" type="isDefinedBy"/>
<mimeType>text/csv</mimeType>
<fileExt>.csv</fileExt>
<formatFamily>Plain.Delimited</formatFamily>
Expand Down
10 changes: 7 additions & 3 deletions SIS/clarin/data/formats/fDICOM.xml
Original file line number Diff line number Diff line change
Expand Up @@ -11,16 +11,20 @@
<!-- this is also video, and can be lossy... messy -->
<extId type="Wikidata">Q28205908</extId>
<extId type="PRONOM">fmt/574</extId>
<extDoc type="enWiki">DICOM</extDoc>
<extDoc type="formatWiki">DICOM</extDoc>
<info type="description">
<p>See <a href="https://en.wikipedia.org/wiki/DICOM">https://en.wikipedia.org/wiki/DICOM</a>.</p>
<p>Please feel welcome to supply the description of this format file via GitHub: either as an
<a href="https://github.com/clarin-eric/standards/issues">issue report</a>, or as a pull
request after forking or browsing the
<a href="https://github.com/clarin-eric/standards/tree/formats/SIS/clarin/data/formats">code under the 'formats' branch</a>.</p>
<!-- Many image compression formats possible, https://en.wikipedia.org/wiki/DICOM -->
<p>Standardised both by ISO (ISO 12052) and NEMA (National Electrical Manufacturers
Association). (The link to the related standard may currently look odd, pending work on its proper visualisation.
Feel welcome to join us.)</p>
</info>
<!--<relation target="SpecDICOM" type="isDefinedBy"/>
ISO 12052, also own committee, and the primary standards body seems to be the NEMA: National Electrical Manufacturers Association
<relation target="SpecDICOM" type="isDefinedBy"/>
<!-- ISO 12052; DICOM also has its own committee, and the primary standards body seems to be NEMA (National Electrical Manufacturers Association)
-->
<mimeType>application/dicom</mimeType>
<fileExt recommended="yes">.dcm</fileExt>
Expand Down
1 change: 1 addition & 0 deletions SIS/clarin/data/formats/fODF.xml
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
<keyword>umbrella format</keyword>
<keyword type="SSO">OASIS</keyword>
<extId type="LOC">fdd000247</extId>
<extDoc type="enWiki">OpenDocument</extDoc>
<info type="description" umbrella="yes">
<p>"The Open Document Format for Office Applications (ODF), also known as OpenDocument, standardized as ISO 26300, is an open
file format for word processing documents, spreadsheets, presentations and graphics and using ZIP-compressed XML files.
Expand Down
1 change: 1 addition & 0 deletions SIS/clarin/data/formats/fTextPlain.xml
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@
<keyword>text format</keyword>
<!-- what other keywords should we add here? -->
<extDoc type="enWiki">Plain_text</extDoc>
<extDoc type="formatWiki">Plain_text</extDoc>
<info type="description">
<p>Plain text is a pure sequence of character codes. (...) Plain text represents character
content only, not its appearance. (...) Plain text must contain enough information to permit
Expand Down
79 changes: 23 additions & 56 deletions SIS/clarin/data/recommendations/ILC4CLARIN-recommendation.xml
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
<?xml-model href="../../schemas/recommendation.xsd" type="application/xml" schematypens="http://purl.oclc.org/dsdl/schematron"?>
<recommendation xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:noNamespaceSchemaLocation="../../schemas/recommendation.xsd">
<header>
<lastUpdateCommitID>147cb5ea659a5752efd819898b43da23e00c6a77</lastUpdateCommitID>
<lastUpdateCommitID>88fa1a1f69809fa389ab2c59a19bdf0a5ecc3f25</lastUpdateCommitID>
<filter>
<centreID>ILC4CLARIN</centreID>
</filter>
Expand All @@ -20,81 +20,48 @@
</nodeInfo>
</centre>
</header>
<info><!--use p, ul, ol elements here--></info>
<info><p>Formats extracted from the uploaded dataset and matched against
CLARIN Standards recommendations.</p>
<p>This list has been submitted by Riccardo Del Gratta in May 2026.</p>
<p>No active curator has yet been appointed for the recommendations.</p></info>
<formats>
<format id="fMOV">
<domain>Audiovisual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fMPEG1">
<domain>Audiovisual Source Language Data</domain>
<format id="fXML">
<domain>Metadata</domain>
<level>recommended</level>
</format>
<format id="fWAVE">
<domain>Audiovisual Source Language Data</domain>
<format id="fTXT">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fHTML">
<domain>Documentation</domain>
<format id="fCSV">
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fLaTeX">
<format id="fRTF">
<domain>Documentation</domain>
<level>recommended</level>
<level>acceptable</level>
</format>
<format id="fPDF">
<domain>Documentation</domain>
<level>acceptable</level>
</format>
<format id="fTeX">
<domain>Documentation</domain>
<level>recommended</level>
</format>
<format id="fXML">
<domain>Documentation</domain>
<level>recommended</level>
</format>
<format id="fGIF">
<domain>Image Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fJPEG">
<domain>Image Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fTIFF">
<domain>Image Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fRDFXML">
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fXML">
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fODT">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fPDF">
<format id="fDOCX">
<domain>Textual Source Language Data</domain>
<level>acceptable</level>
</format>
<format id="fTextPlain">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
<format id="fXLSX">
<domain>Metadata</domain>
<level>acceptable</level>
</format>
<format id="fCSS">
<domain>Tool Support</domain>
<level>recommended</level>
<format id="fPPTX">
<domain>Documentation</domain>
<level>acceptable</level>
</format>
<format id="fGZIP">
<format id="fZIP">
<domain>Packaging</domain>
<level>recommended</level>
<level>acceptable</level>
</format>
<format id="fZIP">
<format id="fGZIP">
<domain>Packaging</domain>
<level>recommended</level>
</format>
Expand Down