Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
23 commits
Select commit Hold shift + click to select a range
004e34c
first commit; restructured python directories to work together among …
AlekSimpson Mar 20, 2025
8d38857
test commit
AlekSimpson Mar 20, 2025
b599da1
added more to the demo testfile and added API reference docs
AlekSimpson Mar 20, 2025
1841c81
fixes
AlekSimpson Mar 27, 2025
725a31f
modulize the semantic file and add a preprocess pipeline
torahoang Mar 31, 2025
f885ce5
modulize the semantic file and add a preprocess pipeline
torahoang Apr 1, 2025
6481a47
fixes
AlekSimpson Apr 1, 2025
fcb2e20
preprocess change
torahoang Apr 8, 2025
a0be4c2
preprocess add simthres default
torahoang Apr 8, 2025
2a94da8
added llm powered semantic comparison (still in beta, needs improveme…
AlekSimpson Apr 19, 2025
a515a97
Create x
patilraje Apr 23, 2025
287f312
Add files via upload
patilraje Apr 23, 2025
9f4d36d
Delete T5-finetuned/x
patilraje Apr 23, 2025
6a76503
implement the agree upon IO schema
torahoang Apr 27, 2025
ec46754
Merge branch 'cidse2025' into preprocessing
torahoang Apr 27, 2025
933ef4f
resolve conflict with cidse2025
torahoang Apr 27, 2025
43da156
changes process_comparison_request to perform_semantic_comparison
torahoang Apr 27, 2025
efb2f88
llm comparison works good enough now, suggested edit position output …
AlekSimpson Apr 27, 2025
c129b59
Merge branch 'modelT5' into cidse2025
AlekSimpson May 9, 2025
99c4531
Merge pull request #6 from grey-box/cidse2025
AlekSimpson May 9, 2025
2e3dfca
Merge branch 'main' into cidse2025-llm_comp_upgrades
francois-pelletier-greybox Aug 10, 2025
ab12c03
updated the requirements.txt
Aug 10, 2025
e791c32
Fix/pytest GitHub actions (#9)
franc00018 Aug 10, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
26 changes: 20 additions & 6 deletions .github/workflows/main.yml
Original file line number Diff line number Diff line change
Expand Up @@ -3,30 +3,44 @@ run-name: ${{ github.actor }} is building symmetry 🚀
on: [push]
jobs:
Test_API_endpoints:
runs-on: windows-latest
runs-on: ubuntu-latest
steps:
- name: Checkout repository
uses: actions/checkout@v4

- name: Set up Python
uses: actions/setup-python@v4
with:
python-version: '3.11.8'
python-version: '3.13'

- name: Install dependencies
run: |
python -m pip install --upgrade pip
cd fastapi/
cd backend-fastapi/
pip install -r requirements.txt
python -m nltk.downloader punkt
echo "=== Installed packages ==="
pip list
echo "=== Current directory ==="
pwd
echo "=== Python path ==="
python -c "import sys; print('\n'.join(sys.path))"
echo "=== Checking pytest installation ==="
python -c "import pytest; print('pytest version:', pytest.__version__)"

- name: Run Pytest
run: python -m pytest
run: |
echo "=== Running pytest from backend-fastapi directory ==="
cd backend-fastapi/
python -m pytest

- name: Install PyInstaller
run: pip install pyinstaller

- name: Build with PyInstaller
run: pyinstaller -F api/flaskr/pyapp.py

run: |
echo "=== Running PyInstaller from backend-fastapi directory ==="
cd backend-fastapi/app/
pyinstaller -F main.py

- run: echo "🎉 The job was automatically triggered by a ${{ github.event_name }} event."
49 changes: 0 additions & 49 deletions LLM/semantic_comparison.py

This file was deleted.

60 changes: 60 additions & 0 deletions T5-finetuned/config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,60 @@
{
"architectures": [
"T5ForConditionalGeneration"
],
"classifier_dropout": 0.0,
"d_ff": 2048,
"d_kv": 64,
"d_model": 512,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 6,
"num_heads": 8,
"num_layers": 6,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"torch_dtype": "float32",
"transformers_version": "4.51.3",
"use_cache": true,
"vocab_size": 32128
}
7 changes: 7 additions & 0 deletions T5-finetuned/generation_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
{
"_from_model_config": true,
"decoder_start_token_id": 0,
"eos_token_id": 1,
"pad_token_id": 0,
"transformers_version": "4.51.3"
}
125 changes: 125 additions & 0 deletions T5-finetuned/special_tokens_map.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,125 @@
{
"additional_special_tokens": [
"<extra_id_0>",
"<extra_id_1>",
"<extra_id_2>",
"<extra_id_3>",
"<extra_id_4>",
"<extra_id_5>",
"<extra_id_6>",
"<extra_id_7>",
"<extra_id_8>",
"<extra_id_9>",
"<extra_id_10>",
"<extra_id_11>",
"<extra_id_12>",
"<extra_id_13>",
"<extra_id_14>",
"<extra_id_15>",
"<extra_id_16>",
"<extra_id_17>",
"<extra_id_18>",
"<extra_id_19>",
"<extra_id_20>",
"<extra_id_21>",
"<extra_id_22>",
"<extra_id_23>",
"<extra_id_24>",
"<extra_id_25>",
"<extra_id_26>",
"<extra_id_27>",
"<extra_id_28>",
"<extra_id_29>",
"<extra_id_30>",
"<extra_id_31>",
"<extra_id_32>",
"<extra_id_33>",
"<extra_id_34>",
"<extra_id_35>",
"<extra_id_36>",
"<extra_id_37>",
"<extra_id_38>",
"<extra_id_39>",
"<extra_id_40>",
"<extra_id_41>",
"<extra_id_42>",
"<extra_id_43>",
"<extra_id_44>",
"<extra_id_45>",
"<extra_id_46>",
"<extra_id_47>",
"<extra_id_48>",
"<extra_id_49>",
"<extra_id_50>",
"<extra_id_51>",
"<extra_id_52>",
"<extra_id_53>",
"<extra_id_54>",
"<extra_id_55>",
"<extra_id_56>",
"<extra_id_57>",
"<extra_id_58>",
"<extra_id_59>",
"<extra_id_60>",
"<extra_id_61>",
"<extra_id_62>",
"<extra_id_63>",
"<extra_id_64>",
"<extra_id_65>",
"<extra_id_66>",
"<extra_id_67>",
"<extra_id_68>",
"<extra_id_69>",
"<extra_id_70>",
"<extra_id_71>",
"<extra_id_72>",
"<extra_id_73>",
"<extra_id_74>",
"<extra_id_75>",
"<extra_id_76>",
"<extra_id_77>",
"<extra_id_78>",
"<extra_id_79>",
"<extra_id_80>",
"<extra_id_81>",
"<extra_id_82>",
"<extra_id_83>",
"<extra_id_84>",
"<extra_id_85>",
"<extra_id_86>",
"<extra_id_87>",
"<extra_id_88>",
"<extra_id_89>",
"<extra_id_90>",
"<extra_id_91>",
"<extra_id_92>",
"<extra_id_93>",
"<extra_id_94>",
"<extra_id_95>",
"<extra_id_96>",
"<extra_id_97>",
"<extra_id_98>",
"<extra_id_99>"
],
"eos_token": {
"content": "</s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
},
"pad_token": {
"content": "<pad>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
},
"unk_token": {
"content": "<unk>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
}
}
Binary file added T5-finetuned/spiece.model
Binary file not shown.
Loading