amlpai04 commited on
Commit
e6c2b26
·
1 Parent(s): 8fa0da0

radical changes for workflow app instead

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +2 -0
  2. app/assets/__init__.py +0 -0
  3. app/assets/examples.py +0 -27
  4. app/assets/images/.gitkeep +0 -0
  5. app/assets/templates/1_simple.yaml +16 -0
  6. app/assets/templates/2_nested.yaml +22 -0
  7. app/assets/templates/c_nested_labels.yaml +41 -0
  8. app/assets/templates/c_nested_reading_order.yaml +24 -0
  9. app/assets/templates/c_nested_with_filter.yaml +28 -0
  10. app/assets/templates/c_simple_gensettings.yaml +21 -0
  11. app/assets/templates/c_simple_multi_output.yaml +24 -0
  12. app/backend.py +0 -0
  13. app/content/ENG/changelog_roadmap/changelog.md +0 -14
  14. app/content/ENG/changelog_roadmap/old_changelog.md +0 -39
  15. app/content/ENG/changelog_roadmap/roadmap.md +0 -27
  16. app/content/ENG/contributions/contributions.md +0 -33
  17. app/content/ENG/contributions/huminfra_image.md +0 -3
  18. app/content/ENG/contributions/riksarkivet_image.md +0 -3
  19. app/content/ENG/duplicate_api/api1.md +0 -11
  20. app/content/ENG/duplicate_api/api2.md +0 -3
  21. app/content/ENG/duplicate_api/api_code1.md +0 -11
  22. app/content/ENG/duplicate_api/api_code2.md +0 -26
  23. app/content/ENG/duplicate_api/duplicate.md +0 -26
  24. app/content/ENG/faq_discussion/discussion.md +0 -7
  25. app/content/ENG/faq_discussion/faq.md +0 -13
  26. app/content/ENG/htrflow/htrflow_col1.md +0 -18
  27. app/content/ENG/htrflow/htrflow_col2.md +0 -23
  28. app/content/ENG/htrflow/htrflow_row1.md +0 -3
  29. app/content/ENG/htrflow/htrflow_tab1.md +0 -7
  30. app/content/ENG/htrflow/htrflow_tab2.md +0 -7
  31. app/content/ENG/htrflow/htrflow_tab3.md +0 -7
  32. app/content/ENG/htrflow/htrflow_tab4.md +0 -7
  33. app/content/NOR/htrflow/htrflow_col1.md +0 -18
  34. app/content/NOR/htrflow/htrflow_col2.md +0 -23
  35. app/content/NOR/htrflow/htrflow_row1.md +0 -3
  36. app/content/NOR/htrflow/htrflow_tab1.md +0 -7
  37. app/content/NOR/htrflow/htrflow_tab2.md +0 -7
  38. app/content/NOR/htrflow/htrflow_tab3.md +0 -7
  39. app/content/NOR/htrflow/htrflow_tab4.md +0 -7
  40. app/content/SWE/htrflow/htrflow_col1.md +0 -18
  41. app/content/SWE/htrflow/htrflow_col2.md +0 -23
  42. app/content/SWE/htrflow/htrflow_row1.md +0 -3
  43. app/content/SWE/htrflow/htrflow_tab1.md +0 -7
  44. app/content/SWE/htrflow/htrflow_tab2.md +0 -7
  45. app/content/SWE/htrflow/htrflow_tab3.md +0 -7
  46. app/content/SWE/htrflow/htrflow_tab4.md +0 -7
  47. app/gradio_config.py +0 -7
  48. app/main.py +12 -71
  49. app/plot_viewer.py +0 -200
  50. app/tabs/adv_htrflow_tab.py +11 -37
README.md CHANGED
@@ -17,4 +17,6 @@ datasets:
17
  "Riksarkivet/placeholder_line_segmentation",
18
  "Riksarkivet/placeholder_htr",
19
  ]
 
 
20
  ---
 
17
  "Riksarkivet/placeholder_line_segmentation",
18
  "Riksarkivet/placeholder_htr",
19
  ]
20
+ license: mit
21
+ short_description: Transform research papers and mathematical concepts into stu
22
  ---
app/assets/__init__.py DELETED
File without changes
app/assets/examples.py DELETED
@@ -1,27 +0,0 @@
1
- import io
2
-
3
- import datasets
4
- from PIL import Image
5
-
6
-
7
- class DemoImages:
8
- def __init__(self, url="Riksarkivet/test_images_demo", cache_dir=".app/assets/images/.cache_images"):
9
- if not hasattr(self, "images_datasets"):
10
- self.images_datasets = datasets.load_dataset(url, cache_dir=cache_dir, split="train")
11
- self.example_df = self.images_datasets.to_pandas()
12
- self.examples_list = self.convert_bytes_to_images()
13
-
14
- def convert_bytes_to_images(self):
15
- examples_list = []
16
- for index, row in self.example_df.iterrows():
17
- image_bytes = row["image"]["bytes"]
18
- image = Image.open(io.BytesIO(image_bytes))
19
-
20
- path_to_image = f"./app/assets/images/image_{index}.jpg"
21
- image.save(path_to_image)
22
-
23
- description = row["text"]
24
-
25
- examples_list.append([description, "Nested segmentation", path_to_image])
26
-
27
- return examples_list
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/assets/images/.gitkeep DELETED
File without changes
app/assets/templates/1_simple.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ steps:
2
+ - step: Segmentation
3
+ settings:
4
+ model: yolo
5
+ model_settings:
6
+ model: Riksarkivet/yolov9-lines-within-regions-1
7
+ - step: TextRecognition
8
+ settings:
9
+ model: TrOCR
10
+ model_settings:
11
+ model: Riksarkivet/trocr-base-handwritten-hist-swe-2
12
+ - step: OrderLines
13
+ - step: Export
14
+ settings:
15
+ format: txt
16
+ dest: outputs
app/assets/templates/2_nested.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ steps:
2
+ - step: Segmentation
3
+ settings:
4
+ model: yolo
5
+ model_settings:
6
+ model: Riksarkivet/yolov9-regions-1
7
+ - step: Segmentation
8
+ settings:
9
+ model: yolo
10
+ model_settings:
11
+ model: Riksarkivet/yolov9-lines-within-regions-1
12
+ - step: TextRecognition
13
+ settings:
14
+ model: TrOCR
15
+ model_settings:
16
+ model: Riksarkivet/trocr-base-handwritten-hist-swe-2
17
+ - step: OrderLines
18
+ - step: Export
19
+ settings:
20
+ format: txt
21
+ dest: text-outputs
22
+
app/assets/templates/c_nested_labels.yaml ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ steps:
2
+ - step: Segmentation
3
+ settings:
4
+ model: yolo
5
+ model_settings:
6
+ model: Riksarkivet/yolov9-regions-1
7
+ generation_settings:
8
+ batch_size: 2
9
+ - step: Segmentation
10
+ settings:
11
+ model: yolo
12
+ model_settings:
13
+ model: Riksarkivet/yolov9-lines-within-regions-1
14
+ generation_settings:
15
+ batch_size: 2
16
+ - step: TextRecognition
17
+ settings:
18
+ model: WordLevelTrocr
19
+ model_settings:
20
+ model: Riksarkivet/trocr-base-handwritten-hist-swe-2
21
+ generation_settings:
22
+ batch_size: 4
23
+ num_beams: 1
24
+ - step: ReadingOrderMarginalia
25
+ settings:
26
+ two_page: auto
27
+ - step: Export
28
+ settings:
29
+ dest: outputs/alto
30
+ format: alto
31
+ - step: Export
32
+ settings:
33
+ dest: outputs/page
34
+ format: page
35
+ labels:
36
+ level_labels:
37
+ - region
38
+ - line
39
+ - word
40
+ sep: _
41
+ template: "{label}{number}"
app/assets/templates/c_nested_reading_order.yaml ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ steps:
2
+ - step: Segmentation
3
+ settings:
4
+ model: yolo
5
+ model_settings:
6
+ model: Riksarkivet/yolov9-regions-1
7
+ - step: Segmentation
8
+ settings:
9
+ model: yolo
10
+ model_settings:
11
+ model: Riksarkivet/yolov9-lines-within-regions-1
12
+ - step: TextRecognition
13
+ settings:
14
+ model: TrOCR
15
+ model_settings:
16
+ model: Riksarkivet/trocr-base-handwritten-hist-swe-2
17
+ - step: ReadingOrderMarginalia
18
+ settings:
19
+ two_page: always
20
+ - step: Export
21
+ settings:
22
+ format: txt
23
+ dest: text-outputs
24
+
app/assets/templates/c_nested_with_filter.yaml ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ steps:
2
+ - step: Segmentation
3
+ settings:
4
+ model: yolo
5
+ model_settings:
6
+ model: Riksarkivet/yolov9-regions-1
7
+ - step: Segmentation
8
+ settings:
9
+ model: yolo
10
+ model_settings:
11
+ model: Riksarkivet/yolov9-lines-within-regions-1
12
+ - step: TextRecognition
13
+ settings:
14
+ model: TrOCR
15
+ model_settings:
16
+ model: Riksarkivet/trocr-base-handwritten-hist-swe-2
17
+ - step: OrderLines
18
+ - step: Export
19
+ settings:
20
+ format: txt
21
+ dest: raw-outputs
22
+ - step: RemoveLowTextConfidenceLines
23
+ settings:
24
+ threshold: 0.95
25
+ - step: Export
26
+ settings:
27
+ format: txt
28
+ dest: cleaned-outputs
app/assets/templates/c_simple_gensettings.yaml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ steps:
2
+ - step: Segmentation
3
+ settings:
4
+ model: yolo
5
+ model_settings:
6
+ model: Riksarkivet/yolov9-lines-within-regions-1
7
+ generation_settings:
8
+ batch_size: 2
9
+ - step: TextRecognition
10
+ settings:
11
+ model: TrOCR
12
+ model_settings:
13
+ model: Riksarkivet/trocr-base-handwritten-hist-swe-2
14
+ generation_settings:
15
+ batch_size: 4
16
+ num_beams: 1
17
+ - step: OrderLines
18
+ - step: Export
19
+ settings:
20
+ format: txt
21
+ dest: outputs
app/assets/templates/c_simple_multi_output.yaml ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ steps:
2
+ - step: Segmentation
3
+ settings:
4
+ model: yolo
5
+ model_settings:
6
+ model: Riksarkivet/yolov9-lines-within-regions-1
7
+ - step: TextRecognition
8
+ settings:
9
+ model: TrOCR
10
+ model_settings:
11
+ model: Riksarkivet/trocr-base-handwritten-hist-swe-2
12
+ - step: OrderLines
13
+ - step: Export
14
+ settings:
15
+ format: txt
16
+ dest: text-outputs
17
+ - step: Export
18
+ settings:
19
+ format: page
20
+ dest: page-outputs
21
+ - step: Export
22
+ settings:
23
+ format: alto
24
+ dest: alto-outputs
app/backend.py DELETED
File without changes
app/content/ENG/changelog_roadmap/changelog.md DELETED
@@ -1,14 +0,0 @@
1
- ## Changelog
2
-
3
- All notable changes to HTRFLOW will be documented here.
4
-
5
- ### [0.1.0] - 2023-11-08
6
-
7
- #### Added
8
-
9
- - Support for TROCR -> Latin and Eng model
10
- - New feature! Compare different runs with GT, see tab **Fast track** > **Compare**
11
-
12
- #### Fixed
13
-
14
- - Fixed bug for Docker and running app locally, [issue](https://github.com/Riksarkivet/HTRFLOW/issues/2)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/changelog_roadmap/old_changelog.md DELETED
@@ -1,39 +0,0 @@
1
- ## Changelog
2
-
3
- All notable changes to HTRFLOW will be documented here.
4
-
5
- ### [0.0.2] - 2023-11-01
6
-
7
- #### Added
8
-
9
- - Better documentation for API, see **Overview** > **Duplicating for own use & API**
10
- - Better documentation for restrictions of app, see **Overview** > **HTRFLOW**
11
-
12
- #### Fixed
13
-
14
- - Fixed bug for API, [issue](https://github.com/Riksarkivet/HTRFLOW/issues/2)
15
-
16
- #### Changed
17
-
18
- Changed the name of **FAQ & Discussion** to **FAQ & Contact**
19
-
20
- ---
21
-
22
- ### [0.0.1] - 2023-10-23
23
-
24
- #### Added
25
-
26
- - Added a new feature to **Stepwise** > **Explore results** > New Text diff and CER component
27
-
28
- #### Fixed
29
-
30
- - Fixed naming conventions of tabs in app so they are more coherent with the code.
31
-
32
- #### Changed
33
-
34
- - Changed the layout in both Fast track and Stepwise to improve the UX
35
-
36
- - Examples are viewed in the middle of the layout
37
- - "Advanced settings" are initial hidden
38
-
39
- - Removed **help** tab for now (documentation of Fast track and Stepwise will come in a later release)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/changelog_roadmap/roadmap.md DELETED
@@ -1,27 +0,0 @@
1
- ## Roadmap
2
-
3
- Our roadmap is where you can learn about what features we're working on. Have any questions or comments about items on the roadmap? See **Overview** > **FAQ & Discussion** for feedback or collaboration.
4
-
5
- ### Working on
6
-
7
- - Release Training and Eval data on HuggingFace
8
-
9
- - Add support for TrOCR models as Text recognition model:
10
-
11
- - Train a TrOCR model specialized on Swedish historical handwritten text.
12
-
13
- - Optimize the backend of the application:
14
- - Package the code
15
- - Add support for batch inference
16
- - Start a collaborative open source project
17
-
18
- ### Backlog
19
-
20
- - Initial document classifier
21
-
22
- - Add support for Different segmentation strategies:
23
-
24
- - Table detection
25
- - Different text layouts with multiple columns
26
-
27
- - Add more endpoints for rest api and add a more extensive documentation
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/contributions/contributions.md DELETED
@@ -1,33 +0,0 @@
1
- ## HTRFLOW – Contributions
2
-
3
- The AI models used in HTRFLOW are the result of a collaborative effort, involving the National Archives in both Sweden and Finland, in partnership with the Stockholm City Archives, Jämtlands läns fornskriftsällskap, citizen science volunteers and researchers from Stockholm and Uppsala Universities.
4
-
5
- Several datasets have been created by participants through Citizen Science using the Handwritten Text Recognition (HTR) software, Transkribus, provided by [READ-COOP SCE](https://readcoop.eu/) .
6
-
7
- ### Archives used to train models for HTRFLOW
8
-
9
- [Svea hovrätt (Renskrivna protokoll), 1713–1735](https://sok.riksarkivet.se/arkiv/H2hpDbNn14scxjzdWqAaJ1)
10
-
11
- [Bergmästaren i Nora m fl bergslag (Hammartingsprotokoll), 1698–1765](https://sok.riksarkivet.se/arkiv/M5Fe2TT9rH6cxG02H087k3)
12
-
13
- [Trolldomskommissionen, mainly 1670s](https://sok.riksarkivet.se/trolldomskommissionen)
14
-
15
- [Bergskollegium, 1718–1758](https://sok.riksarkivet.se/arkiv/SMFky31ekQ80Qsk0UCZZE2)
16
-
17
- [Jämtlands domsaga, 1647–1688](https://sok.riksarkivet.se/arkiv/2l4NYFT8rH6cxG02H087k3)
18
-
19
- [Stockholms domkapitel, 1728–1759](https://sok.riksarkivet.se/arkiv/etg1tyeEaIPMBzKbUKTjw1)
20
-
21
- [Politikollegiet, 1729–1759](https://sok.riksarkivet.se/arkiv/1lQnXIDiKaYxRLBlK1dGF3)
22
-
23
- [Göteborgs poliskammare före 1900 (Detektiva polisens rapportböcker), 1868–1901](https://sok.riksarkivet.se/arkiv/oLTOi9yxweZJUG018W43t3)
24
-
25
- [Renovated Court Records, the National Archives of Finland, 1800s](https://tuomiokirjat.kansallisarkisto.fi/)
26
-
27
- ### Ongoing research collaborations
28
-
29
- [Transcription node Sweden – machine interpretation and citizen research combined](https://riksarkivet.se/forskning), Swedish National Archives and University of Gothenburg, funded by the Swedish National Heritage Board.
30
-
31
- [Mapping the geographies of early modern mining knowledge. A digital history of the study tours of the Swedish Bureau of Mines, 1691–1826](https://www.idehist.uu.se/forskning/projekt/den-tidigmoderna-bergsvetenskapens-geografier), Uppsala University and Stockholm University, funded by the Swedish Research Council.
32
-
33
- The Swedish National Archives' research and development on HTR is part of the Swedish national infrastructure Huminfra. [Click here](https://riksarkivet.se/huminfra) for more information.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/contributions/huminfra_image.md DELETED
@@ -1,3 +0,0 @@
1
- <a href="https://www.huminfra.se/">
2
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/Huminfra_logo.png?raw=true" width="17%" align="left" margin-right="100" />
3
- </a>
 
 
 
 
app/content/ENG/contributions/riksarkivet_image.md DELETED
@@ -1,3 +0,0 @@
1
- <a href="https://riksarkivet.se">
2
- <img src="https://raw.githubusercontent.com/Borg93/Riksarkivet_docs/main/docs/assets/fav-removebg-preview.png" width="17%" align="right" margin-right="100" />
3
- </a>
 
 
 
 
app/content/ENG/duplicate_api/api1.md DELETED
@@ -1,11 +0,0 @@
1
- ## Usage of Client API
2
-
3
- If you prefer to run **Fast track** programmatically, we offer an API for that purpose.
4
-
5
- - [REST API](https://riksarkivet-htr-demo.hf.space/?view=api)
6
- Documentation for gradio client with [python](https://www.gradio.app/guides/getting-started-with-the-python-client)
7
- Documentation for gradio client with [javascript](https://www.gradio.app/guides/getting-started-with-the-js-client)
8
-
9
- **Note**: More extensive APIs and documentation can be added in the future upon request.
10
-
11
- See example below for usage of API in python:
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/duplicate_api/api2.md DELETED
@@ -1,3 +0,0 @@
1
- ### Output from the api
2
-
3
- The output from the api is currently in the format of Page XML, which can be imported into this [viewer](https://huggingface.co/spaces/Riksarkivet/Viewer_demo).
 
 
 
 
app/content/ENG/duplicate_api/api_code1.md DELETED
@@ -1,11 +0,0 @@
1
- from gradio_client import Client # pip install gradio_client
2
-
3
- # Change url to your client (localhost: http://127.0.0.1:7860/)
4
-
5
- client = Client("https://huggingface.co/spaces/Riksarkivet/htr_demo")
6
- job = client.submit(
7
- "https://your.image.url.or.pah.jpg",
8
- api_name="/run_htr_pipeline",
9
- )
10
-
11
- print(job.result())
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/duplicate_api/api_code2.md DELETED
@@ -1,26 +0,0 @@
1
- Loaded as API: http://127.0.0.1:7860/ ✔
2
-
3
- <?xml version="1.0" encoding="UTF-8"?>
4
- <PcGts xmlns="http://schema.primaresearch.org/PAGE/gts/pagecontent/2013-07-15" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://schema.primaresearch.org/PAGE/gts/pagecontent/2013-07-15 http://schema.primaresearch.org/PAGE/gts/pagecontent/2013-07-15/pagecontent.xsd">
5
- <Metadata>
6
- <Creator>Swedish National Archives</Creator>
7
- <Created>2023-08-21, 13:28:06</Created>
8
- </Metadata>
9
- <Page imageFilename="page_xml.xml" imageWidth="4885" imageHeight="4066">
10
- <TextRegion id="region_0" custom="readingOrder {index:0;}">
11
- <Coords points="1477,265 1467,217 1440,201 1370,211 1248,203 1127,224 1067,224 1003,212 844,247 766,243 747,261 742,280 751,332 766,346 1258,341 1357,332 1439,341 1468,327"/>
12
- <TextLine id="line_region_0_0" custom="readingOrder {index:0;}">
13
- <Coords points="1458,248 1443,222 1449,200 1412,215 1366,200 1325,207 1302,200 1241,200 1235,206 1205,200 1187,210 1085,222 957,206 795,239 769,273 771,333 783,340 1445,333 1450,324"/>
14
- <TextEquiv>
15
- <Unicode>År 1865.</Unicode>
16
- </TextEquiv>
17
- <PredScore pred_score="0.9482"/>
18
- </TextLine>
19
- </TextRegion>
20
- <TextRegion id="region_1" custom="readingOrder {index:1;}">
21
- ......................................
22
- </TextRegion>
23
- </Page>
24
- </PcGts>
25
-
26
- # Output is truncated. View as a scrollable element or open in a text editor. Adjust cell output settings...
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/duplicate_api/duplicate.md DELETED
@@ -1,26 +0,0 @@
1
- ## Duplicating for own use
2
-
3
- Please be aware of certain limitations when using the application:
4
-
5
- - This application is primarily designed for demonstration purposes and is not intended for scaling up HTR.
6
- - Currently, the Swedish National Archives has constraints on sharing hardware, leading to a queue system for high demand.
7
- - The demo is hosted on Hugging Face domains, and they may rate-limit you if there's an excessive number of requests in a short timeframe, especially when using the API.
8
-
9
- For those requiring heavy usage, you can conveniently duplicate the application.
10
-
11
- - Duplicate [application](https://huggingface.co/spaces/Riksarkivet/htr_demo?duplicate=true).
12
-
13
- By doing so, you'll create your own private app, which allows for unlimited requests without any restrictions. The image below shows the minimum hardware you need to use if you don't have access to hardware yourself:
14
-
15
- <figure>
16
-
17
- <img src="https://raw.githubusercontent.com/Borg93/htr_gradio_file_placeholder/main/hardware_example.png" alt="HTR_tool" style="width:75%; display: block; margin-left: auto; margin-right:auto;" >
18
- <figcaption style="text-align: center;"> <em> Figure - Choose a hardware that has atleast a GPU </em></figcaption>
19
- </figure>
20
-
21
- For individuals with access to dedicated hardware, additional options are available. You have the flexibility to run this application on your own machine utilizing Docker, or by cloning the repository directly. Doing so allows you to leverage your hardware's capabilities to their fullest extent.
22
-
23
- - [Clone with Docker](https://huggingface.co/spaces/Riksarkivet/htr_demo?docker=true)
24
- - [Clone Repo](https://huggingface.co/spaces/Riksarkivet/htr_demo/settings?clone=true)
25
-
26
- **Note**: To take advantage of CUDA for accelerated inferences, an Nvidia graphics card is required. This setup significantly enhances the performance, ensuring a smoother and faster operation.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/faq_discussion/discussion.md DELETED
@@ -1,7 +0,0 @@
1
- ## Contact us
2
-
3
- If you have any questions, or suggestions for features or improvements, please don’t hesitate to contact us.
4
-
5
- - Open a discussion on [HuggingFace](https://huggingface.co/spaces/Riksarkivet/htr_demo/discussions).
6
-
7
- - Send an email to: forskning@riksarkivet.se
 
 
 
 
 
 
 
 
app/content/ENG/faq_discussion/faq.md DELETED
@@ -1,13 +0,0 @@
1
- ## Frequently Asked Questions
2
-
3
- **Q**: <u>Is my data secure? Can I upload my own images?</u>
4
- **A**: Absolutely. Uploaded files are not saved or stored.
5
-
6
- **Q**: <u>Why am I always in a queue?</u>
7
- **A**: This is due to hardware constraints and rate limits imposed by Hugging Face. For alternative ways to use the app, refer to the tab > **Documentation** under > **Duplication for Own Use & API**.
8
-
9
- **Q**: <u>Why is Fast track so slow?</u>
10
- **A**: The current speed is due to hardware limitations and the present state of the code. However, we plan to update the application in future releases, which will significantly improve the performance of the application.
11
-
12
- **Q**: <u>Is it possible to run Fast track or the API on image batches?</u>
13
- **A**: Not currently, but we plan to implement this feature in the future.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/htrflow/htrflow_col1.md DELETED
@@ -1,18 +0,0 @@
1
- ## Introduction
2
-
3
- The Swedish National Archives introduces a demonstrational end-to-end HTR (Handwritten Text Recognition) pipeline. The pipeline consists of two instance segmentation models, one trained for segmenting text-regions within running-text document images, and another trained for segmenting text-lines within these regions. The text-lines are then transcribed by a text-recognition model trained on a vast set of swedish handwriting ranging from the 17th to the 19th century.
4
-
5
- ## Usage
6
-
7
- It needs to be emphasized that this application is intended mainly for demo-purposes. Its aim is to showcase our pipeline for transcribing historical, running-text documents, not to put the pipeline into large-scale production.
8
- **Note**: In the future we’ll optimize the code to suit a production scenario with multi-GPU, batch-inference, but this is still a work in progress. <br>
9
-
10
- For an insight into the upcoming features we are working on:
11
-
12
- - Navigate to the > **Overview** > **Changelog & Roadmap**.
13
-
14
- ## Limitations
15
-
16
- The demo, hosted on Huggingface and assigned a T4 GPU, can only handle two users submissions at a time. If you experience long wait times or unresponsiveness, this is the reason. In the future, we plan to host this solution ourselves, with a better server for an improved user experience, optimized code, and multiple model options. Exciting developments are on the horizon!
17
-
18
- It's also important to note that the models work on running text, not text in table format.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/htrflow/htrflow_col2.md DELETED
@@ -1,23 +0,0 @@
1
- ## Source Code
2
-
3
- Please fork and leave a star on Github if you like it! The code for this project can be found here:
4
-
5
- - [Github](https://github.com/Riksarkivet/HTRFLOW)
6
-
7
- **Note**: We will in the future package all of the code for mass HTR (batch inference on multi-GPU setup), but the code is still work in progress.
8
-
9
- ## Models
10
-
11
- The models used in this demo are very much a work in progress, and as more data, and new architectures, become available, they will be retrained and reevaluated. For more information about the models, please refer to their model-cards on Huggingface.
12
-
13
- - [Riksarkivet/rtmdet_regions](https://huggingface.co/Riksarkivet/rtmdet_regions)
14
- - [Riksarkivet/rtmdet_lines](https://huggingface.co/Riksarkivet/rtmdet_lines)
15
- - [Riksarkivet/satrn_htr](https://huggingface.co/https://huggingface.co/Riksarkivet/satrn_htr)
16
-
17
- ## Datasets
18
-
19
- Train and testsets created by the Swedish National Archives will be released here:
20
-
21
- - [Riksarkivet/placeholder_region_segmentation](https://huggingface.co/datasets/Riksarkivet/placeholder_region_segmentation)
22
- - [Riksarkivet/placeholder_line_segmentation](https://huggingface.co/datasets/Riksarkivet/placeholder_line_segmentation)
23
- - [Riksarkivet/placeholder_htr](https://huggingface.co/datasets/Riksarkivet/placeholder_htr)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/ENG/htrflow/htrflow_row1.md DELETED
@@ -1,3 +0,0 @@
1
- ## The Pipeline in Overview
2
-
3
- The steps in the pipeline can be seen below as follows:
 
 
 
 
app/content/ENG/htrflow/htrflow_tab1.md DELETED
@@ -1,7 +0,0 @@
1
- ### Binarization
2
-
3
- The reason for binarizing the images before processing them is that we want the models to generalize as well as possible. By training on only binarized images and by binarizing images before running them through the pipeline, we take the target domain closer to the training domain, and reduce negative effects of background variation, background noise etc., on the final results. The pipeline implements a simple adaptive thresholding algorithm for binarization.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_bin.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/ENG/htrflow/htrflow_tab2.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text-region segmentation
2
-
3
- To facilitate the text-line segmentation process, it is advantageous to segment the image into text-regions beforehand. This initial step offers several benefits, including reducing variations in line spacing, eliminating blank areas on the page, establishing a clear reading order, and distinguishing marginalia from the main text. The segmentation model utilized in this process predicts both bounding boxes and masks. Although the model has the capability to predict both, only the masks are utilized for the segmentation tasks of lines and regions. An essential post-processing step involves checking for regions that are contained within other regions. During this step, only the containing region is retained, while the contained region is discarded. This ensures that the final segmented text-regions are accurate and devoid of overlapping or redundant areas. This ensures that there’s no duplicate text-regions sent to the text-recognition model.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_region.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/ENG/htrflow/htrflow_tab3.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text-line segmentation
2
-
3
- This is also an instance segmentation model, trained on extracting text-lines from the cropped text-regions. The same post-processing as in the text-region segmentation step, is done in the text-line segmentation step.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_line.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/ENG/htrflow/htrflow_tab4.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text Recognition
2
-
3
- The text-recognition model was trained on approximately one million handwritten text-line images ranging from the 17th to the 19th century. See the model card for detailed evaluation results, and results from some fine-tuning experiments.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_htr.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/NOR/htrflow/htrflow_col1.md DELETED
@@ -1,18 +0,0 @@
1
- ### Introduktion
2
-
3
- Riksarkivet presenterar en demonstrationspipeline för HTR (Handwritten Text Recognition). Pipelinen består av två instanssegmenteringsmodeller: en tränad för att segmentera textregioner i bilder av löpande-textdokument och en annan tränad för att segmentera textrader inom dessa regioner. Textraderna transkriberas därefter av en textigenkänningsmodell som är tränad på ett stort dataset med svensk handskrift från 1600- till 1800-talet.
4
-
5
- ### Användning
6
-
7
- Det är viktigt att betona att denna applikation främst är avsedd för demonstrationsändamål. Målet är att visa upp vår pipeline för att transkribera historiska dokument med löpande text, inte att använda pipelinen i storskalig produktion.
8
- **Obs**: I framtiden kommer vi att optimera koden för att passa ett produktionsscenario med multi-GPU och batch-inferens, men detta arbete pågår fortfarande. <br>
9
-
10
- För en inblick i de kommande funktionerna vi arbetar med:
11
-
12
- - Navigera till > **Översikt** > **Ändringslogg och roadmap**.
13
-
14
- ### Begränsningar
15
-
16
- Demon, som är värd på Huggingface och tilldelad en T4 GPU, kan bara hantera två användarinlämningar åt gången. Om du upplever långa väntetider eller att applikationen inte svarar, är detta anledningen. I framtiden planerar vi att själva vara värdar för denna lösning, med en bättre server för en förbättrad användarupplevelse, optimerad kod och flera modellalternativ. Spännande utveckling är på gång!
17
-
18
- Det är också viktigt att notera att modellerna fungerar på löpande text och inte text i tabellformat.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/NOR/htrflow/htrflow_col2.md DELETED
@@ -1,23 +0,0 @@
1
- ## Source Code
2
-
3
- Please fork and leave a star on Github if you like it! The code for this project can be found here:
4
-
5
- - [Github](https://github.com/Riksarkivet/HTRFLOW)
6
-
7
- **Note**: We will in the future package all of the code for mass HTR (batch inference on multi-GPU setup), but the code is still work in progress.
8
-
9
- ## Models
10
-
11
- The models used in this demo are very much a work in progress, and as more data, and new architectures, become available, they will be retrained and reevaluated. For more information about the models, please refer to their model-cards on Huggingface.
12
-
13
- - [Riksarkivet/rtmdet_regions](https://huggingface.co/Riksarkivet/rtmdet_regions)
14
- - [Riksarkivet/rtmdet_lines](https://huggingface.co/Riksarkivet/rtmdet_lines)
15
- - [Riksarkivet/satrn_htr](https://huggingface.co/https://huggingface.co/Riksarkivet/satrn_htr)
16
-
17
- ## Datasets
18
-
19
- Train and testsets created by the Swedish National Archives will be released here:
20
-
21
- - [Riksarkivet/placeholder_region_segmentation](https://huggingface.co/datasets/Riksarkivet/placeholder_region_segmentation)
22
- - [Riksarkivet/placeholder_line_segmentation](https://huggingface.co/datasets/Riksarkivet/placeholder_line_segmentation)
23
- - [Riksarkivet/placeholder_htr](https://huggingface.co/datasets/Riksarkivet/placeholder_htr)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/NOR/htrflow/htrflow_row1.md DELETED
@@ -1,3 +0,0 @@
1
- ## The Pipeline in Overview
2
-
3
- The steps in the pipeline can be seen below as follows:
 
 
 
 
app/content/NOR/htrflow/htrflow_tab1.md DELETED
@@ -1,7 +0,0 @@
1
- ### Binarization
2
-
3
- The reason for binarizing the images before processing them is that we want the models to generalize as well as possible. By training on only binarized images and by binarizing images before running them through the pipeline, we take the target domain closer to the training domain, and reduce negative effects of background variation, background noise etc., on the final results. The pipeline implements a simple adaptive thresholding algorithm for binarization.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_bin.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/NOR/htrflow/htrflow_tab2.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text-region segmentation
2
-
3
- To facilitate the text-line segmentation process, it is advantageous to segment the image into text-regions beforehand. This initial step offers several benefits, including reducing variations in line spacing, eliminating blank areas on the page, establishing a clear reading order, and distinguishing marginalia from the main text. The segmentation model utilized in this process predicts both bounding boxes and masks. Although the model has the capability to predict both, only the masks are utilized for the segmentation tasks of lines and regions. An essential post-processing step involves checking for regions that are contained within other regions. During this step, only the containing region is retained, while the contained region is discarded. This ensures that the final segmented text-regions are accurate and devoid of overlapping or redundant areas. This ensures that there’s no duplicate text-regions sent to the text-recognition model.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_region.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/NOR/htrflow/htrflow_tab3.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text-line segmentation
2
-
3
- This is also an instance segmentation model, trained on extracting text-lines from the cropped text-regions. The same post-processing as in the text-region segmentation step, is done in the text-line segmentation step.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_line.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/NOR/htrflow/htrflow_tab4.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text Recognition
2
-
3
- The text-recognition model was trained on approximately one million handwritten text-line images ranging from the 17th to the 19th century. See the model card for detailed evaluation results, and results from some fine-tuning experiments.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_htr.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/SWE/htrflow/htrflow_col1.md DELETED
@@ -1,18 +0,0 @@
1
- ### Introduktion
2
-
3
- Riksarkivet presenterar en demonstrationspipeline för HTR (Handwritten Text Recognition). Pipelinen består av två instanssegmenteringsmodeller: en tränad för att segmentera textregioner i bilder av löpande-textdokument och en annan tränad för att segmentera textrader inom dessa regioner. Textraderna transkriberas därefter av en textigenkänningsmodell som är tränad på ett stort dataset med svensk handskrift från 1600- till 1800-talet.
4
-
5
- ### Användning
6
-
7
- Det är viktigt att betona att denna applikation främst är avsedd för demonstrationsändamål. Målet är att visa upp vår pipeline för att transkribera historiska dokument med löpande text, inte att använda pipelinen i storskalig produktion.
8
- **Obs**: I framtiden kommer vi att optimera koden för att passa ett produktionsscenario med multi-GPU och batch-inferens, men detta arbete pågår fortfarande. <br>
9
-
10
- För en inblick i de kommande funktionerna vi arbetar med:
11
-
12
- - Navigera till > **Översikt** > **Ändringslogg och roadmap**.
13
-
14
- ### Begränsningar
15
-
16
- Demon, som är värd på Huggingface och tilldelad en T4 GPU, kan bara hantera två användarinlämningar åt gången. Om du upplever långa väntetider eller att applikationen inte svarar, är detta anledningen. I framtiden planerar vi att själva vara värdar för denna lösning, med en bättre server för en förbättrad användarupplevelse, optimerad kod och flera modellalternativ. Spännande utveckling är på gång!
17
-
18
- Det är också viktigt att notera att modellerna fungerar på löpande text och inte text i tabellformat.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/SWE/htrflow/htrflow_col2.md DELETED
@@ -1,23 +0,0 @@
1
- ## Source Code
2
-
3
- Please fork and leave a star on Github if you like it! The code for this project can be found here:
4
-
5
- - [Github](https://github.com/Riksarkivet/HTRFLOW)
6
-
7
- **Note**: We will in the future package all of the code for mass HTR (batch inference on multi-GPU setup), but the code is still work in progress.
8
-
9
- ## Models
10
-
11
- The models used in this demo are very much a work in progress, and as more data, and new architectures, becomes available, they will be retrained and reevaluated. For more information about the models, please refer to their model-cards on Huggingface.
12
-
13
- - [Riksarkivet/rtmdet_regions](https://huggingface.co/Riksarkivet/rtmdet_regions)
14
- - [Riksarkivet/rtmdet_lines](https://huggingface.co/Riksarkivet/rtmdet_lines)
15
- - [Riksarkivet/satrn_htr](https://huggingface.co/https://huggingface.co/Riksarkivet/satrn_htr)
16
-
17
- ## Datasets
18
-
19
- Train and testsets created by the Swedish National Archives will be released here:
20
-
21
- - [Riksarkivet/placeholder_region_segmentation](https://huggingface.co/datasets/Riksarkivet/placeholder_region_segmentation)
22
- - [Riksarkivet/placeholder_line_segmentation](https://huggingface.co/datasets/Riksarkivet/placeholder_line_segmentation)
23
- - [Riksarkivet/placeholder_htr](https://huggingface.co/datasets/Riksarkivet/placeholder_htr)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/content/SWE/htrflow/htrflow_row1.md DELETED
@@ -1,3 +0,0 @@
1
- ## The Pipeline in Overview
2
-
3
- The steps in the pipeline can be seen below as follows:
 
 
 
 
app/content/SWE/htrflow/htrflow_tab1.md DELETED
@@ -1,7 +0,0 @@
1
- ### Binarization
2
-
3
- The reason for binarizing the images before processing them is that we want the models to generalize as well as possible. By training on only binarized images and by binarizing images before running them through the pipeline, we take the target domain closer to the training domain, and reduce negative effects of background variation, background noise etc., on the final results. The pipeline implements a simple adaptive thresholding algorithm for binarization.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_bin.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/SWE/htrflow/htrflow_tab2.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text-region segmentation
2
-
3
- To facilitate the text-line segmentation process, it is advantageous to segment the image into text-regions beforehand. This initial step offers several benefits, including reducing variations in line spacing, eliminating blank areas on the page, establishing a clear reading order, and distinguishing marginalia from the main text. The segmentation model utilized in this process predicts both bounding boxes and masks. Although the model has the capability to predict both, only the masks are utilized for the segmentation tasks of lines and regions. An essential post-processing step involves checking for regions that are contained within other regions. During this step, only the containing region is retained, while the contained region is discarded. This ensures that the final segmented text-regions are accurate and devoid of overlapping or redundant areas. This ensures that there’s no duplicate text-regions sent to the text-recognition model.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_region.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/SWE/htrflow/htrflow_tab3.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text-line segmentation
2
-
3
- This is also an instance segmentation model, trained on extracting text-lines from the cropped text-regions. The same post-processing as in the text-region segmentation step, is done in the text-line segmentation step.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_line.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/content/SWE/htrflow/htrflow_tab4.md DELETED
@@ -1,7 +0,0 @@
1
- ### Text Recognition
2
-
3
- The text-recognition model was trained on approximately one million handwritten text-line images ranging from the 17th to the 19th century. See the model card for detailed evaluation results, and results from some fine-tuning experiments.
4
-
5
- <figure>
6
- <img src="https://github.com/Borg93/htr_gradio_file_placeholder/blob/main/app_project_htr.png?raw=true" alt="HTR_tool" style="width:70%; display: block; margin-left: auto; margin-right:auto;" >
7
- </figure>
 
 
 
 
 
 
 
 
app/gradio_config.py CHANGED
@@ -13,12 +13,5 @@ theme = gr.themes.Default(
13
  )
14
 
15
  css = """
16
- body > gradio-app > div > div > div.wrap.svelte-1rjryqp > footer > a {
17
- display: none !important;
18
- }
19
- body > gradio-app > div > div > div.wrap.svelte-1rjryqp > footer > div {
20
- display: none !important;
21
- }
22
- #langdropdown {width: 100px;}
23
 
24
  """
 
13
  )
14
 
15
  css = """
 
 
 
 
 
 
 
16
 
17
  """
app/main.py CHANGED
@@ -1,97 +1,38 @@
1
- import logging
2
-
3
  import gradio as gr
4
 
5
  from app.gradio_config import css, theme
6
  from app.tabs.adv_htrflow_tab import adv_htrflow_pipeline
7
- from app.tabs.data_explorer_tab import data_explorer
8
  from app.tabs.examples_tab import examples
9
- from app.tabs.htrflow_tab import htrflow_pipeline
10
- from app.tabs.overview_tab import overview, overview_language
11
- from app.utils.lang_helper import get_tab_updates
 
 
12
  from app.utils.md_helper import load_markdown
13
 
14
- logger = logging.getLogger("gradio_log")
15
-
16
-
17
- TAB_LABELS = {
18
- "ENG": ["Home", "Simple", "Advanced", "Examples"],
19
- "SWE": ["Hem", "Enkel", "Avancerad", "Exempel"],
20
- }
21
 
22
- LANG_CHOICES = ["ENG", "SWE"]
23
 
24
  with gr.Blocks(title="HTRflow", theme=theme, css=css) as demo:
25
  with gr.Row():
26
- local_language = gr.BrowserState(
27
- default_value="ENG", storage_key="selected_language"
28
- )
29
- main_language = gr.State(value="ENG")
30
-
31
  with gr.Column(scale=1):
32
- language_selector = gr.Dropdown(
33
- choices=LANG_CHOICES,
34
- value="ENG",
35
- container=False,
36
- min_width=50,
37
- scale=0,
38
- elem_id="langdropdown",
39
- )
40
-
41
  with gr.Column(scale=2):
42
  gr.Markdown(load_markdown(None, "main_title"))
43
  with gr.Column(scale=1):
44
  gr.Markdown(load_markdown(None, "main_sub_title"))
45
 
46
  with gr.Tabs(elem_classes="top-navbar") as navbar:
47
- with gr.Tab(label="Home") as tab_home:
48
- overview.render()
49
-
50
- with gr.Tab(label="Simple") as tab_simple_htr:
51
- htrflow_pipeline.render()
52
 
53
- with gr.Tab(label="Advanced") as tab_custom_htr:
54
  adv_htrflow_pipeline.render()
55
 
56
- with gr.Tab(label="Examples") as tab_examples:
57
  examples.render()
58
 
59
- # with gr.Tab(label="Data Explorer") as tab_data_explorer:
60
- # data_explorer.render()
61
-
62
- @demo.load(
63
- inputs=[local_language],
64
- outputs=[language_selector, main_language, overview_language],
65
- )
66
- def load_language(saved_values):
67
- return (saved_values,) * 3
68
-
69
- @language_selector.change(
70
- inputs=[language_selector],
71
- outputs=[
72
- local_language,
73
- main_language,
74
- overview_language,
75
- ],
76
- )
77
- def save_language_to_browser(selected_language):
78
- return (selected_language,) * 3
79
-
80
- @main_language.change(
81
- inputs=[main_language],
82
- outputs=[
83
- tab_home,
84
- tab_simple_htr,
85
- tab_custom_htr,
86
- ],
87
- )
88
- def update_main_tabs(selected_language):
89
- return (*get_tab_updates(selected_language, TAB_LABELS),)
90
-
91
- @main_language.change(inputs=[main_language])
92
- def log_on_language_change(selected_language):
93
- logger.info(f"Language changed to: {selected_language}")
94
-
95
 
96
  demo.queue()
97
 
 
 
 
1
  import gradio as gr
2
 
3
  from app.gradio_config import css, theme
4
  from app.tabs.adv_htrflow_tab import adv_htrflow_pipeline
 
5
  from app.tabs.examples_tab import examples
6
+ from app.tabs.templating import (
7
+ templating_block,
8
+ template_image_folder,
9
+ template_yaml_folder,
10
+ )
11
  from app.utils.md_helper import load_markdown
12
 
13
+ gr.set_static_paths(paths=[template_image_folder])
14
+ gr.set_static_paths(paths=[template_yaml_folder])
 
 
 
 
 
15
 
 
16
 
17
  with gr.Blocks(title="HTRflow", theme=theme, css=css) as demo:
18
  with gr.Row():
 
 
 
 
 
19
  with gr.Column(scale=1):
20
+ pass
 
 
 
 
 
 
 
 
21
  with gr.Column(scale=2):
22
  gr.Markdown(load_markdown(None, "main_title"))
23
  with gr.Column(scale=1):
24
  gr.Markdown(load_markdown(None, "main_sub_title"))
25
 
26
  with gr.Tabs(elem_classes="top-navbar") as navbar:
27
+ with gr.Tab(label="Templating") as tab_templating:
28
+ templating_block.render()
 
 
 
29
 
30
+ with gr.Tab(label="Submit Job") as tab_submit_job:
31
  adv_htrflow_pipeline.render()
32
 
33
+ with gr.Tab(label="Output & Visualize") as tab_examples:
34
  examples.render()
35
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
36
 
37
  demo.queue()
38
 
app/plot_viewer.py DELETED
@@ -1,200 +0,0 @@
1
- import xml.etree.ElementTree as ET
2
- from io import BytesIO
3
-
4
- import cv2
5
- import gradio as gr
6
- import numpy as np
7
- import requests
8
- from PIL import Image
9
-
10
-
11
- def parse_alto_xml(xml_file):
12
- """Parse the ALTO XML file to extract polygons and text content for each TextLine."""
13
- tree = ET.parse(xml_file)
14
- root = tree.getroot()
15
- ns = {"alto": "http://www.loc.gov/standards/alto/ns-v4#"}
16
-
17
- annotations = []
18
- transcriptions = {}
19
-
20
- for text_block in root.findall(".//alto:TextBlock", ns):
21
- for text_line in text_block.findall("alto:TextLine", ns):
22
- shape = text_line.find("alto:Shape", ns)
23
-
24
- if shape is not None:
25
- polygon = shape.find("alto:Polygon", ns)
26
- if polygon is not None:
27
- polygon_points = polygon.attrib["POINTS"]
28
- points = [
29
- tuple(map(int, point.split(",")))
30
- for point in polygon_points.split()
31
- ]
32
- else:
33
- hpos = int(text_line.attrib["HPOS"])
34
- vpos = int(text_line.attrib["VPOS"])
35
- width = int(text_line.attrib["WIDTH"])
36
- height = int(text_line.attrib["HEIGHT"])
37
- points = [
38
- (hpos, vpos),
39
- (hpos + width, vpos),
40
- (hpos + width, vpos + height),
41
- (hpos, vpos + height),
42
- ]
43
-
44
- content = " ".join(
45
- [
46
- string.attrib["CONTENT"]
47
- for string in text_line.findall("alto:String", ns)
48
- ]
49
- )
50
- label = text_line.attrib["ID"]
51
-
52
- annotations.append((points, label))
53
- transcriptions[label] = content
54
-
55
- text_area_content = "\n".join(transcriptions[label] for label in transcriptions)
56
-
57
- return annotations, transcriptions, text_area_content
58
-
59
-
60
- def visualize_polygons_on_image(
61
- image, annotations, alpha=0.5, include_reading_order=False
62
- ):
63
- """Visualize polygons on the image with an optional reading order overlay."""
64
- overlay = image.copy()
65
- for _, (polygon, label) in enumerate(annotations):
66
- color = (
67
- np.random.randint(0, 255),
68
- np.random.randint(0, 255),
69
- np.random.randint(0, 255),
70
- )
71
- cv2.fillPoly(overlay, [np.array(polygon, dtype=np.int32)], color)
72
-
73
- if include_reading_order:
74
- centroid = np.mean(np.array(polygon), axis=0).astype(int)
75
- cv2.putText(
76
- overlay,
77
- str(label),
78
- tuple(centroid),
79
- cv2.FONT_HERSHEY_SIMPLEX,
80
- 0.5,
81
- (0, 0, 0),
82
- 1,
83
- cv2.LINE_AA,
84
- )
85
-
86
- return cv2.addWeighted(overlay, alpha, image, 1 - alpha, 0)
87
-
88
-
89
- def visualize(
90
- xml_file, image_source, image_id, uploaded_image, include_reading_order=False
91
- ):
92
- if image_source == "Use IIIF image":
93
- if not image_id:
94
- raise gr.Error("Please enter an Image ID.")
95
- image_url = f"https://iiifintern.ra.se/arkis!{image_id}/full/max/0/default.jpg"
96
- response = requests.get(image_url)
97
- if response.status_code != 200:
98
- raise gr.Error(f"Failed to download image from {image_url}")
99
- image = np.array(Image.open(BytesIO(response.content)))
100
- else:
101
- if uploaded_image is None:
102
- raise gr.Error("Please upload an image.")
103
- image = uploaded_image
104
-
105
- annotations, transcriptions, text_area_content = parse_alto_xml(xml_file)
106
- annotated_image = visualize_polygons_on_image(
107
- image, annotations, include_reading_order=include_reading_order
108
- )
109
-
110
- return annotated_image, annotations, transcriptions, text_area_content
111
-
112
-
113
- def get_transcription_from_coords(annotations, transcriptions, evt: gr.SelectData):
114
- """Get the transcription for the polygon clicked in the annotated image."""
115
- x, y = evt.index[0], evt.index[1]
116
- for points, label in annotations:
117
- polygon = np.array(points, dtype=np.int32)
118
- if cv2.pointPolygonTest(polygon, (x, y), False) >= 0:
119
- return transcriptions.get(label, "No transcription available.")
120
- return "No transcription available."
121
-
122
-
123
- with gr.Blocks(title="XML Visualization App") as app:
124
- with gr.Tab("Visualize"):
125
- annotations_state = gr.State()
126
- transcriptions_state = gr.State()
127
-
128
- with gr.Row():
129
- with gr.Column():
130
- xml_input = gr.File(label="Upload ALTO XML File", file_types=[".xml"])
131
- with gr.Column():
132
- image_source = gr.Radio(
133
- choices=["Use IIIF image", "Upload your own image"],
134
- label="Image Source",
135
- value="Use IIIF image",
136
- )
137
- image_id_input = gr.Textbox(
138
- label="Image ID",
139
- placeholder="Enter image ID (e.g., 30003365_00001)",
140
- visible=True,
141
- )
142
- image_upload = gr.Image(
143
- label="Upload Image", type="numpy", visible=False
144
- )
145
- include_reading_order_input = gr.Checkbox(label="Include Reading Order")
146
- process_button = gr.Button("Visualize Alto", scale=0, variant="primary")
147
-
148
- def update_image_source(choice):
149
- if choice == "Use IIIF image":
150
- return [gr.update(visible=True), gr.update(visible=False)]
151
- else:
152
- return [gr.update(visible=False), gr.update(visible=True)]
153
-
154
- image_source.change(
155
- update_image_source,
156
- inputs=image_source,
157
- outputs=[image_id_input, image_upload],
158
- )
159
-
160
- with gr.Row():
161
- with gr.Column(scale=3):
162
- annotated_image_output = gr.Image(
163
- label="Annotated Image", interactive=True
164
- )
165
- with gr.Column(scale=2):
166
- transcription_output = gr.TextArea(
167
- label="Transcription",
168
- interactive=False,
169
- show_copy_button=True,
170
- lines=30,
171
- )
172
- transcription_selected = gr.Textbox(
173
- label="Selected Polygon", interactive=False, show_copy_button=True
174
- )
175
-
176
- process_button.click(
177
- visualize,
178
- inputs=[
179
- xml_input,
180
- image_source,
181
- image_id_input,
182
- image_upload,
183
- include_reading_order_input,
184
- ],
185
- outputs=[
186
- annotated_image_output,
187
- annotations_state,
188
- transcriptions_state,
189
- transcription_output,
190
- ],
191
- )
192
-
193
- annotated_image_output.select(
194
- get_transcription_from_coords,
195
- inputs=[annotations_state, transcriptions_state],
196
- outputs=transcription_selected,
197
- )
198
-
199
- app.queue()
200
- app.launch()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app/tabs/adv_htrflow_tab.py CHANGED
@@ -1,35 +1,22 @@
1
- import time
2
-
3
  import gradio as gr
4
 
 
5
  with gr.Blocks() as adv_htrflow_pipeline:
6
  with gr.Row(variant="panel"):
7
  with gr.Column(scale=3):
8
 
9
- image_mask2 = gr.ImageEditor(
10
- label="Uploaded image",
11
- sources="upload",
12
- interactive=True,
13
- layers=False,
14
- eraser=False,
15
- brush=False,
16
- height=400,
17
- transforms="crop",
18
- crop_size="16,5",
19
- visible=False,
20
- )
21
-
22
- image_mask = gr.Gallery(
23
  file_types=["image"],
24
  label="Upload images",
25
  interactive=True,
26
- height=400,
27
  object_fit="cover",
 
28
  columns=5,
29
  )
 
30
  with gr.Row(visible=True) as yaml_pipeline:
31
  with gr.Accordion(label="Run Template", open=False):
32
- gr.Checkbox(value=True, label="Batch", container=False, scale=0)
33
  custom_template_yaml = gr.Code(
34
  value="Paste your custom pipeline here",
35
  language="yaml",
@@ -58,7 +45,11 @@ with gr.Blocks() as adv_htrflow_pipeline:
58
  info="Checkboxgroup should be basedon output structure from htrflow",
59
  )
60
 
61
- gr.Image(interactive=False)
 
 
 
 
62
 
63
  with gr.Tab("Table"):
64
  pass
@@ -67,6 +58,7 @@ with gr.Blocks() as adv_htrflow_pipeline:
67
  pass
68
 
69
  def foo():
 
70
  return gr.update(visible=True), "test"
71
 
72
  click_event = run_button.click(
@@ -79,21 +71,3 @@ with gr.Blocks() as adv_htrflow_pipeline:
79
  outputs=cancel_button,
80
  cancels=[click_event],
81
  )
82
-
83
- image_mask2.upload(
84
- fn=None,
85
- inputs=None,
86
- outputs=None,
87
- js="""
88
- () => {
89
- // Target the button using its attributes
90
- const button = document.querySelector('button[aria-label="Transform button"][title="Transform button"]');
91
- if (button) {
92
- button.click(); // Simulate a click
93
- console.log('Transform button clicked.');
94
- } else {
95
- console.error('Transform button not found.');
96
- }
97
- }
98
- """,
99
- ).then(fn=lambda: gr.update(crop=None), inputs=None, outputs=image_mask2)
 
 
 
1
  import gradio as gr
2
 
3
+
4
  with gr.Blocks() as adv_htrflow_pipeline:
5
  with gr.Row(variant="panel"):
6
  with gr.Column(scale=3):
7
 
8
+ image_batch_input = gr.Gallery(
 
 
 
 
 
 
 
 
 
 
 
 
 
9
  file_types=["image"],
10
  label="Upload images",
11
  interactive=True,
 
12
  object_fit="cover",
13
+ preview=True,
14
  columns=5,
15
  )
16
+
17
  with gr.Row(visible=True) as yaml_pipeline:
18
  with gr.Accordion(label="Run Template", open=False):
19
+
20
  custom_template_yaml = gr.Code(
21
  value="Paste your custom pipeline here",
22
  language="yaml",
 
45
  info="Checkboxgroup should be basedon output structure from htrflow",
46
  )
47
 
48
+ gr.Image(
49
+ interactive=False,
50
+ show_fullscreen_button=True,
51
+ show_share_button=True,
52
+ )
53
 
54
  with gr.Tab("Table"):
55
  pass
 
58
  pass
59
 
60
  def foo():
61
+ gr.Info("hello morgan")
62
  return gr.update(visible=True), "test"
63
 
64
  click_event = run_button.click(
 
71
  outputs=cancel_button,
72
  cancels=[click_event],
73
  )