scraperai

View on PyPI | Reverse Dependencies (0)

0.0.2 scraperai-0.0.2-py3-none-any.whl

Wheel Details

Project: scraperai
Version: 0.0.2
Filename: scraperai-0.0.2-py3-none-any.whl
Download: [link]
Size: 63806
MD5: a8c491ea3f60c8f140f437343f8da44a
SHA256: 987cf6b1ad9faeafed9cbf0e681c93bc8daf39bb897dafb289b57c6884bbf16b
Uploaded: 2024-04-17 13:45:23 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: scraperai
Version: 0.0.2
Summary: ScraperAI is an open-source, AI-powered tool designed to simplify web scraping for users of all skill levels.
Author: Iakov Kaiumov
Author-Email: help[at]scraper-ai.com
Home-Page: https://github.com/scraperai/scraperai
License: GPL-3.0 license
Requires-Dist: packaging (==23.2)
Requires-Dist: langchain (==0.1.16)
Requires-Dist: langchain-community
Requires-Dist: langchain-openai
Requires-Dist: langchain-text-splitters
Requires-Dist: openai
Requires-Dist: tiktoken
Requires-Dist: htmlmin
Requires-Dist: requests
Requires-Dist: beautifulsoup4
Requires-Dist: lxml
Requires-Dist: selenium (==4.9.1)
Requires-Dist: webdriver-manager
Requires-Dist: numpy (==1.26.4)
Requires-Dist: pandas
Requires-Dist: openpyxl
Requires-Dist: tabulate
Requires-Dist: python-dotenv
Requires-Dist: tqdm
Requires-Dist: retry
Requires-Dist: Pillow
Requires-Dist: pydantic
Requires-Dist: appdirs
Requires-Dist: click
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 4765 characters]

WHEEL

Wheel-Version: 1.0
Generator: bdist_wheel (0.43.0)
Root-Is-Purelib: true
Tag: py3-none-any

RECORD

Path Digest Size
scraperai/__init__.py sha256=thfZDJctCXU2rizeiNJsD2R8uiRz-qtobLHcXFlxNmc 230
scraperai/exceptions.py sha256=qIxVS5a52gsAllcQALFR43OnVCjd8s9e4FYsYV6mr50 76
scraperai/models.py sha256=8ZgizqnmiahTJxjcQpEljub3Toh2NRJ8P2BPeMcKVhE 1949
scraperai/scraper.py sha256=w28DCEAciXXCstWuGDO7P5CStvc1n0KvVK1NCh6qFWE 3129
scraperai/cli/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
scraperai/cli/app.py sha256=wpeg6Gc1mXw8ju7EqRmU58rTgYvth0viWPxNk_qGIxo 1449
scraperai/cli/controller.py sha256=kPO7i3lQHITPQQD6tQi7Epn75YaczkS6YKvwuWNAWq8 14853
scraperai/cli/model.py sha256=PZNXa3C7NWJKgFZS_sZ5iG1DZYiju6plbNvjg9NCjTA 544
scraperai/cli/utils.py sha256=kzee6e-Yn6jbbnoLW1q7HmerdXEQNSim7bpuNYlsIJ0 2062
scraperai/cli/view.py sha256=k_CtNnAkRFdev1Orj7I6aqiw0DyUnH2Od3lTQTsTZDY 9736
scraperai/crawlers/__init__.py sha256=YjK810pohtk3blHZbQCzWUznTqZ-uNQdYJ4ppG5kcQg 165
scraperai/crawlers/base.py sha256=JtStf0fXVQIPS2hVRCIuDsohfdHGkXwgHSdGXUZ6yRo 417
scraperai/crawlers/requests.py sha256=dRMxzoBPGMdXxvfMepjuS1LBdtySHecaHLLEcBXzz4c 1383
scraperai/crawlers/selenium.py sha256=uPDxUekq4LCzomPY431sMv1-5qfCT-QrPLN_fGxYneg 3473
scraperai/crawlers/webdriver/__init__.py sha256=Fd-rjDZo16skFGKm9LCP22NwVBIDLBiTCB7-qV3UVlM 120
scraperai/crawlers/webdriver/base.py sha256=RidyAIE82Vdm604M1CghnHwtFvSOSk11tAD1ZaMSaGA 636
scraperai/crawlers/webdriver/local.py sha256=SI-6DMYgQB-2Afmv1bw9HNvr-lw4ud0NN_9MQXSgFLY 2202
scraperai/crawlers/webdriver/manager.py sha256=fBRbIcS_5x5mMrGAwLMx1VPfjeI2R07HbDHO7AVeZk0 2047
scraperai/crawlers/webdriver/remote.py sha256=0d85ee14z4bm7D9QVCTUQ8NXUXp6-vjEJG8YuVXJ7QQ 3571
scraperai/crawlers/webdriver/storage.py sha256=pydUR14xUuVgoG_YroK64qhI9pq5FsXOzPw03YSGGbE 1373
scraperai/crawlers/webdriver/useragents.py sha256=Uh4VIzIyC8hjdjEHoH3kzhMQmi1Z5bH_3q-3SrU2VJo 288
scraperai/crawlers/webdriver/useragents.txt sha256=CmUP_gH_81phVKvGtAVIdQdawnVjauOsw3Q9son-PvA 98063
scraperai/crawlers/webdriver/utils.py sha256=y7qSrAICjpdP1Ao7L282UaUdhNfysNY_lvO2YODObQw 709
scraperai/lm/__init__.py sha256=tj48mrRINMKK96wx5sS1vWHEi0tb3sPQ2zTeqCD-f_Q 86
scraperai/lm/base.py sha256=6VxKllPOlFUzCGmbk78qB2Ks6nD7xbMRG4g9Uq5r_dg 508
scraperai/lm/openai.py sha256=4hV200Vl8h8CzyBtoMGgwzCnaTmpT2LBqPV4uLVYFvQ 2774
scraperai/parsers/__init__.py sha256=Nc7OYYy5e4Nnzb5ZJHzToiKl8oWQN6lr2d8A9UX7iLw 352
scraperai/parsers/agent.py sha256=UyytsZIX1YzY6S-LMStRe5V7XyR3Nnkp0pEcGbbtQi0 1425
scraperai/parsers/catalog_item_detector.py sha256=x54r4I4MXTgj1voPxNajkiiP1yxAfV7HsdOWZD8rd2s 4058
scraperai/parsers/data_fields_extractor.py sha256=ztzN-tp39MmLjZEBUpl5WQBuqdxb_Cns4oeA482sLxc 6155
scraperai/parsers/pagination_detector.py sha256=LC8ew0LJvXQfWhTUBaSf7ONU3vURlNtrR_4HtDAOk5o 4299
scraperai/parsers/parserai.py sha256=HpPxWbDoAkx5ZI0A5iqcoyF0PLLAioxNYPkbwDn4rn4 4080
scraperai/parsers/utils.py sha256=7caPDNctNSmER2666kS1r5cSFFEOjYhpX87K7PjRWiw 2111
scraperai/parsers/webpage_classifier.py sha256=3AWP21_eq7khWJL1iC_VfvwrnHE1eDC785qXzp76bE4 2162
scraperai/parsers/webpage_descriptor.py sha256=uFqLp1nt-vgHUA5qZaTPLBIT3qfZ6E0edPG02QQgZ3I 6001
scraperai/utils/__init__.py sha256=10ZQKSr3IOLAuGYwrMfZz8KR4unDxYU-mh0YyVkOmZY 1847
scraperai/utils/data.py sha256=eOagiMlCQKZfn47UD5QwesmNzLRowFfkYkQJMZ3NRQg 489
scraperai/utils/html.py sha256=eCIaQQ19XM7hlp5JN4AHeyr35Ycw2HZWRC6_EqDrsX8 6313
scraperai/utils/image.py sha256=3o4cnJXrMscLks32HX4yV9yldwmKOuqmzWiAoXnK49A 1562
tests/__init__.py sha256=T6X3pZLQ_BtI5nT5E0lUoRLpy_Lca-3dPpdaHYhcvqg 20
tests/settings.py sha256=oGWBWPqvnYRlDhh6afw5gLvrugtDR_rJpEFQkPlCFd8 995
tests/test_classification.py sha256=XqMYu6HjFI3W81Sq9F1TaBFB5ODoAn8sqbv8zTDCk80 1261
tests/test_detection.py sha256=LSopu7kvGxhxdAz0AF8VZwJMeAQZ9bddwRV9bMO9fS0 1700
tests/test_extractor.py sha256=Oc5562rKH_l0WUGm6xOEDOZC_uiachrz4sDFVYLOkmg 1687
tests/test_html_utils.py sha256=LlbjumP1r1YOp9z1hq3PEneG0DBZPuG9MD-V4j6tkTo 4912
tests/test_webdriver.py sha256=dIRJr7nbomZUrOAzsLpxYEo1963pU4Xno1d_CLMsZuo 3198
scraperai-0.0.2.dist-info/LICENSE sha256=ixuiBLtpoK3iv89l7ylKkg9rs2GzF9ukPH7ynZYzK5s 35148
scraperai-0.0.2.dist-info/METADATA sha256=pKxWW8IvUUPsxtMIcUDihmI8SVOJrgj570c6JZf97Rg 5776
scraperai-0.0.2.dist-info/WHEEL sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ 92
scraperai-0.0.2.dist-info/entry_points.txt sha256=kQOuITYeob2D1tmCTxq3K2j01z2OTSgX4jtKBAcpJ18 53
scraperai-0.0.2.dist-info/top_level.txt sha256=OsaYuCzFw19l_YsJdnIPCMnWCXOYAw0op7ArI_tWXc0 16
scraperai-0.0.2.dist-info/RECORD

top_level.txt

scraperai
tests

entry_points.txt

scraperai = scraperai.cli.app:main