Király Zoltán committed on
Commit
a245fbf
·
1 Parent(s): 2c2b98f

Fix: Clean up requirements.txt to resolve build conflicts

Browse files
.github/workflows/secret-tester.yml CHANGED
@@ -1,20 +1,34 @@
1
- name: "Titkok Tesztelése"
 
2
  on:
3
  workflow_dispatch:
 
4
  jobs:
5
- test-secrets-job:
6
  runs-on: ubuntu-latest
7
  steps:
8
  - name: "Repository letöltése"
9
  uses: actions/checkout@v4
10
- - name: "Python beállítása"
 
11
  uses: actions/setup-python@v5
12
  with:
13
  python-version: '3.10'
14
- - name: "Titkok ellenőrzése a Python szkripttel"
15
- run: python test_secrets.py
 
 
 
 
 
 
 
 
 
 
 
 
16
  env:
17
- ES_API_KEY_FROM_WORKFLOW: ${{ secrets.ES_API_KEY }}
18
- ES_CLOUD_ID_FROM_WORKFLOW: ${{ secrets.ES_CLOUD_ID }}
19
- PAT_FROM_WORKFLOW: ${{ secrets.PAT }}
20
- TOGETHER_API_KEY_FROM_WORKFLOW: ${{ secrets.TOGETHER_API_KEY }}
 
1
+ name: "Weboldal Indexelő Futtatása"
2
+
3
  on:
4
  workflow_dispatch:
5
+
6
  jobs:
7
+ build-and-index:
8
  runs-on: ubuntu-latest
9
  steps:
10
  - name: "Repository letöltése"
11
  uses: actions/checkout@v4
12
+
13
+ - name: "Python 3.10 beállítása és gyorsítótár használata"
14
  uses: actions/setup-python@v5
15
  with:
16
  python-version: '3.10'
17
+ cache: 'pip'
18
+
19
+ - name: "Build tools telepítése (a C alapú csomagokhoz)"
20
+ run: |
21
+ sudo apt-get update
22
+ sudo apt-get install -y build-essential python3-dev
23
+
24
+ - name: "Függőségek telepítése"
25
+ run: |
26
+ python -m pip install --upgrade pip
27
+ pip install -r requirements.txt
28
+
29
+ - name: "Indexer script futtatása"
30
+ run: python web_indexer_universal_v7.py
31
  env:
32
+ ES_CLOUD_ID: ${{ secrets.ES_CLOUD_ID }}
33
+ ES_API_KEY: ${{ secrets.ES_API_KEY }}
34
+ TOGETHER_API_KEY: ${{ secrets.TOGETHER_API_KEY }}
 
requirements.txt CHANGED
@@ -1,249 +1,9 @@
1
- absl-py
2
- aiohappyeyeballs
3
- aiohttp
4
- aiolimiter
5
- aiosignal
6
- albucore
7
- albumentations
8
- altair
9
- annotated-types
10
- anyio
11
- astor
12
- astunparse
13
- attrs
14
- banks
15
- beautifulsoup4
16
- blinker
17
- blis
18
- boto3
19
- botocore
20
- cachelib
21
- cachetools
22
- catalogue
23
- certifi
24
- cffi
25
- charset-normalizer
26
- click
27
- cloudpathlib
28
- colorama
29
- confection
30
- contourpy
31
- cryptography
32
- cycler
33
- cymem
34
- Cython
35
- dataclasses-json
36
- decorator
37
- deep-translator
38
- Deprecated
39
- dirtyjson
40
- docopt
41
- easyocr
42
- elastic-transport
43
  elasticsearch
44
- et_xmlfile
45
- eval_type_backport
46
- filelock
47
- filetype
48
- fire
49
- Flask
50
- Flask-Cors
51
- Flask-Session
52
- flatbuffers
53
- fonttools
54
- frozenlist
55
- fsspec
56
- gast
57
- gitdb
58
- GitPython
59
- google-ai-generativelanguage
60
- google-api-core
61
- google-api-python-client
62
- google-auth
63
- google-auth-httplib2
64
- google-cloud-core
65
- google-cloud-speech
66
- google-cloud-storage
67
- google-crc32c
68
- google-generativeai
69
- google-pasta
70
- google-resumable-media
71
- googleapis-common-protos
72
- greenlet
73
- griffe
74
- grpcio
75
- grpcio-status
76
- h11
77
- h5py
78
- httpcore
79
- httplib2
80
- httpx
81
- httpx-sse
82
- huggingface-hub
83
- ibm-cloud-sdk-core
84
- ibm-cos-sdk
85
- ibm-cos-sdk-core
86
- ibm-cos-sdk-s3transfer
87
- ibm-generative-ai
88
- ibm-watson
89
- idna
90
- imageio
91
- itsdangerous
92
- Jinja2
93
- jmespath
94
- joblib
95
- jsonschema
96
- jsonschema-specifications
97
- keras
98
- keybert
99
- kiwisolver
100
- langcodes
101
- language_data
102
- lazy_loader
103
- Levenshtein
104
- libclang
105
- llama-index-core
106
- llama-index-embeddings-huggingface
107
- lmdb
108
- lxml
109
- marisa-trie
110
- Markdown
111
- markdown-it-py
112
- MarkupSafe
113
- marshmallow
114
- matplotlib
115
- mdurl
116
- ml_dtypes
117
- mosestokenizer
118
- mpmath
119
- msgspec
120
- multidict
121
- murmurhash
122
- mypy-extensions
123
- namex
124
- narwhals
125
- nest-asyncio
126
- networkx
127
- ninja
128
- nltk
129
- numpy
130
- opencv-contrib-python
131
- opencv-python
132
- opencv-python-headless
133
- openfile
134
- openpyxl
135
- opt-einsum
136
- optree
137
- outcome
138
- packaging
139
- paddleocr
140
- paddlepaddle
141
- pandas
142
- pdf2image
143
- pdfminer.six
144
- pdfplumber
145
- pillow
146
- platformdirs
147
- preshed
148
- propcache
149
- proto-plus
150
- protobuf
151
- pyarrow
152
- pyasn1
153
- pyasn1_modules
154
- pyclipper
155
- pycparser
156
- pydantic
157
- pydantic_core
158
- pydeck
159
- pydub
160
- Pygments
161
- PyJWT
162
- PyMuPDF
163
- pyparsing
164
- pypdfium2
165
- PySocks
166
- pyspellchecker
167
- pytesseract
168
- python-bidi
169
- python-dateutil
170
- python-docx
171
- python-dotenv
172
- python-Levenshtein
173
- pytz
174
- PyYAML
175
- RapidFuzz
176
- redis
177
- referencing
178
- regex
179
  requests
180
- rich
181
- rpds-py
182
- rsa
183
- s3transfer
184
- sacremoses
185
- safetensors
186
- scikit-image
187
- scikit-learn
188
- scipy
189
- selenium
190
- sentence-transformers
191
- sentencepiece
192
- setuptools
193
- shapely
194
- shellingham
195
- simsimd
196
- six
197
- smart-open
198
- smmap
199
- sniffio
200
- sortedcontainers
201
- soupsieve
202
- spacy
203
- spacy-legacy
204
- spacy-loggers
205
- SQLAlchemy
206
- srsly
207
- streamlit
208
- stringzilla
209
- sympy
210
- tabulate
211
- tenacity
212
- tensorboard
213
- tensorboard-data-server
214
- tensorflow
215
- termcolor
216
- tf_keras
217
- thinc
218
- threadpoolctl
219
- tifffile
220
- tika
221
- tiktoken
222
- together
223
- tokenizers
224
- toml
225
- toolwrapper
226
  torch
227
- torchaudio
228
- torchvision
229
- tornado
230
- tqdm
231
- transformers
232
- trio
233
- trio-websocket
234
- typer
235
- typing-inspect
236
- typing_extensions
237
- tzdata
238
- uctools
239
- uritemplate
240
- urllib3
241
- wasabi
242
- watchdog
243
- weasel
244
- websocket-client
245
- Werkzeug
246
- wheel
247
- wrapt
248
- wsproto
249
- yarl
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  elasticsearch
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  requests
3
+ beautifulsoup4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  torch
5
+ together
6
+ python-dotenv
7
+ tiktoken
8
+ nltk
9
+ sentence-transformers
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
requirementsS.txt ADDED
@@ -0,0 +1,249 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ absl-py
2
+ aiohappyeyeballs
3
+ aiohttp
4
+ aiolimiter
5
+ aiosignal
6
+ albucore
7
+ albumentations
8
+ altair
9
+ annotated-types
10
+ anyio
11
+ astor
12
+ astunparse
13
+ attrs
14
+ banks
15
+ beautifulsoup4
16
+ blinker
17
+ blis
18
+ boto3
19
+ botocore
20
+ cachelib
21
+ cachetools
22
+ catalogue
23
+ certifi
24
+ cffi
25
+ charset-normalizer
26
+ click
27
+ cloudpathlib
28
+ colorama
29
+ confection
30
+ contourpy
31
+ cryptography
32
+ cycler
33
+ cymem
34
+ Cython
35
+ dataclasses-json
36
+ decorator
37
+ deep-translator
38
+ Deprecated
39
+ dirtyjson
40
+ docopt
41
+ easyocr
42
+ elastic-transport
43
+ elasticsearch
44
+ et_xmlfile
45
+ eval_type_backport
46
+ filelock
47
+ filetype
48
+ fire
49
+ Flask
50
+ Flask-Cors
51
+ Flask-Session
52
+ flatbuffers
53
+ fonttools
54
+ frozenlist
55
+ fsspec
56
+ gast
57
+ gitdb
58
+ GitPython
59
+ google-ai-generativelanguage
60
+ google-api-core
61
+ google-api-python-client
62
+ google-auth
63
+ google-auth-httplib2
64
+ google-cloud-core
65
+ google-cloud-speech
66
+ google-cloud-storage
67
+ google-crc32c
68
+ google-generativeai
69
+ google-pasta
70
+ google-resumable-media
71
+ googleapis-common-protos
72
+ greenlet
73
+ griffe
74
+ grpcio
75
+ grpcio-status
76
+ h11
77
+ h5py
78
+ httpcore
79
+ httplib2
80
+ httpx
81
+ httpx-sse
82
+ huggingface-hub
83
+ ibm-cloud-sdk-core
84
+ ibm-cos-sdk
85
+ ibm-cos-sdk-core
86
+ ibm-cos-sdk-s3transfer
87
+ ibm-generative-ai
88
+ ibm-watson
89
+ idna
90
+ imageio
91
+ itsdangerous
92
+ Jinja2
93
+ jmespath
94
+ joblib
95
+ jsonschema
96
+ jsonschema-specifications
97
+ keras
98
+ keybert
99
+ kiwisolver
100
+ langcodes
101
+ language_data
102
+ lazy_loader
103
+ Levenshtein
104
+ libclang
105
+ llama-index-core
106
+ llama-index-embeddings-huggingface
107
+ lmdb
108
+ lxml
109
+ marisa-trie
110
+ Markdown
111
+ markdown-it-py
112
+ MarkupSafe
113
+ marshmallow
114
+ matplotlib
115
+ mdurl
116
+ ml_dtypes
117
+ mosestokenizer
118
+ mpmath
119
+ msgspec
120
+ multidict
121
+ murmurhash
122
+ mypy-extensions
123
+ namex
124
+ narwhals
125
+ nest-asyncio
126
+ networkx
127
+ ninja
128
+ nltk
129
+ numpy
130
+ opencv-contrib-python
131
+ opencv-python
132
+ opencv-python-headless
133
+ openfile
134
+ openpyxl
135
+ opt-einsum
136
+ optree
137
+ outcome
138
+ packaging
139
+ paddleocr
140
+ paddlepaddle
141
+ pandas
142
+ pdf2image
143
+ pdfminer.six
144
+ pdfplumber
145
+ pillow
146
+ platformdirs
147
+ preshed
148
+ propcache
149
+ proto-plus
150
+ protobuf
151
+ pyarrow
152
+ pyasn1
153
+ pyasn1_modules
154
+ pyclipper
155
+ pycparser
156
+ pydantic
157
+ pydantic_core
158
+ pydeck
159
+ pydub
160
+ Pygments
161
+ PyJWT
162
+ PyMuPDF
163
+ pyparsing
164
+ pypdfium2
165
+ PySocks
166
+ pyspellchecker
167
+ pytesseract
168
+ python-bidi
169
+ python-dateutil
170
+ python-docx
171
+ python-dotenv
172
+ python-Levenshtein
173
+ pytz
174
+ PyYAML
175
+ RapidFuzz
176
+ redis
177
+ referencing
178
+ regex
179
+ requests
180
+ rich
181
+ rpds-py
182
+ rsa
183
+ s3transfer
184
+ sacremoses
185
+ safetensors
186
+ scikit-image
187
+ scikit-learn
188
+ scipy
189
+ selenium
190
+ sentence-transformers
191
+ sentencepiece
192
+ setuptools
193
+ shapely
194
+ shellingham
195
+ simsimd
196
+ six
197
+ smart-open
198
+ smmap
199
+ sniffio
200
+ sortedcontainers
201
+ soupsieve
202
+ spacy
203
+ spacy-legacy
204
+ spacy-loggers
205
+ SQLAlchemy
206
+ srsly
207
+ streamlit
208
+ stringzilla
209
+ sympy
210
+ tabulate
211
+ tenacity
212
+ tensorboard
213
+ tensorboard-data-server
214
+ tensorflow
215
+ termcolor
216
+ tf_keras
217
+ thinc
218
+ threadpoolctl
219
+ tifffile
220
+ tika
221
+ tiktoken
222
+ together
223
+ tokenizers
224
+ toml
225
+ toolwrapper
226
+ torch
227
+ torchaudio
228
+ torchvision
229
+ tornado
230
+ tqdm
231
+ transformers
232
+ trio
233
+ trio-websocket
234
+ typer
235
+ typing-inspect
236
+ typing_extensions
237
+ tzdata
238
+ uctools
239
+ uritemplate
240
+ urllib3
241
+ wasabi
242
+ watchdog
243
+ weasel
244
+ websocket-client
245
+ Werkzeug
246
+ wheel
247
+ wrapt
248
+ wsproto
249
+ yarl