... | ... | @@ -10,7 +10,7 @@ The 'name' field is the name of the transcription in which the text content will |
|
|
By default, the segmentation for the selected images, both regions and lines, will be deleted. You can disable this behavior by unchecking 'Override existing segmentation.', in which case the system will try to match the lines and regions by their `ID` attribute. The old content of each matching line is then stored in its history, and new lines/regions are created when no matching existing element is found.
|
|
|
|
|
|
### Alto
|
|
|
Upload a valid [ALTO 4 XML](https://en.wikipedia.org/wiki/ALTO_(XML)) file for segmentation and transcriptions.
|
|
|
Upload a valid [ALTO 4 XML](https://en.wikipedia.org/wiki/ALTO_(XML)) file (versions 4.0 to 4.2) for segmentation and transcriptions.
|
|
|
|
|
|
A basic example:
|
|
|
```xml
|
... | ... | @@ -24,13 +24,20 @@ A basic example: |
|
|
<fileName>my_image.png</fileName>
|
|
|
</sourceImageInformation>
|
|
|
</Description>
|
|
|
<Tags>
|
|
|
<OtherTag ID="type1" LABEL="Some region type" DESCRIPTION="block type"/>
|
|
|
<OtherTag ID="type2" LABEL="Some line type" DESCRIPTION="line type"/>
|
|
|
</Tags>
|
|
|
<Layout>
|
|
|
<Page WIDTH="850" HEIGHT="1083" PHYSICAL_IMG_NR="0" ID="page_0">
|
|
|
<PrintSpace HPOS="0" VPOS="0" WIDTH="850" HEIGHT="1083">
|
|
|
<TextBlock HPOS="0" VPOS="0" ID="textblock_0" WIDTH="850" HEIGHT="1083">
|
|
|
<TextLine ID="line_0" HPOS="160" VPOS="771" WIDTH="25" HEIGHT="28">
|
|
|
<TextBlock HPOS="0" VPOS="0" ID="textblock_0" WIDTH="850" HEIGHT="1083" TAGREFS="type1">
|
|
|
<Shape>
|
|
|
<Polygon POINTS="0 0 850 0 850 1083 0 1083"/>
|
|
|
</Shape>
|
|
|
<TextLine ID="line_0" HPOS="160" VPOS="771" WIDTH="25" HEIGHT="28" TAGREFS="type2">
|
|
|
<Shape>
|
|
|
<Polygon POINTS="160,771,185,799"/>
|
|
|
<Polygon POINTS="160 771 185 799"/>
|
|
|
</Shape>
|
|
|
<String ID="segment_0" CONTENT="This is an example" HPOS="160" VPOS="771" WIDTH="25" HEIGHT="28" WC="0.9995"></String>
|
|
|
</TextLine>
|
... | ... | @@ -96,9 +103,9 @@ example of full PageXML file: |
|
|
<RegionRefIndexed index="1" regionRef="r2"/>
|
|
|
</OrderedGroup>
|
|
|
</ReadingOrder>
|
|
|
<TextRegion orientation="0.0" id="r2">
|
|
|
<TextRegion orientation="0.0" id="r2" custom="structure {type:Some region type;}">
|
|
|
<Coords points="113,29 113,1021 697,1021 697,29"/>
|
|
|
<TextLine id="r2l1">
|
|
|
<TextLine id="r2l1" custom="structure {type:Some line type;}">
|
|
|
<Coords points="150,64 346,60 425,81 460,60 616,64 621,5 396,2 328,3 304,21 271,4 232,23 150,17"/>
|
|
|
<Baseline points="155,55 180,55 206,55 231,55 257,55 283,55 308,55 334,56 359,56 385,56 411,56 436,56 462,56 487,56 513,55 539,55 564,55 590,54 616,53"/>
|
|
|
<TextEquiv>
|
... | ... | |