-
Notifications
You must be signed in to change notification settings - Fork 9
Expand file tree
/
Copy pathpackage.json
More file actions
85 lines (85 loc) · 2.33 KB
/
package.json
File metadata and controls
85 lines (85 loc) · 2.33 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
{
"name": "@lightfeed/extractor",
"version": "0.4.1",
"description": "Use LLMs to robustly extract and enrich structured data from HTML and markdown",
"main": "dist/index.js",
"types": "dist/index.d.ts",
"files": [
"dist"
],
"engines": {
"node": ">=18"
},
"scripts": {
"build": "tsc",
"clean": "rimraf dist",
"prepare": "npm run clean && npm run build",
"prepublishOnly": "npm run test:unit",
"test": "jest",
"test:unit": "jest tests/unit",
"test:integration": "jest tests/integration",
"test:watch": "jest --watch",
"test:cov": "jest --coverage",
"test:local": "ts-node src/dev/runLocalTest.ts",
"test:usage": "ts-node src/dev/testUsage.ts",
"test:browser": "ts-node src/dev/testBrowserExtraction.ts",
"test:html2md": "jest tests/integration/html-to-markdown.test.ts",
"test:html2md:update": "git submodule update --init --recursive test-data",
"test:html2md:sync": "cd test-data && git pull origin main && cd ..",
"test:html2md:regenerate": "ts-node src/dev/regenerateGroundTruth.ts",
"lint": "tslint -p tsconfig.json",
"dev": "ts-node src/example.ts",
"dev:html2md": "ts-node src/dev/testHtmlToMarkdown.ts"
},
"repository": {
"type": "git",
"url": "git+https://github.com/lightfeed/extractor.git"
},
"keywords": [
"llm",
"extraction",
"web-scraping",
"html",
"markdown",
"structured-data",
"langchain",
"openai",
"gemini",
"anthropic",
"ollama"
],
"author": "Lightfeed",
"license": "Apache-2.0",
"bugs": {
"url": "https://github.com/lightfeed/extractor/issues"
},
"homepage": "https://github.com/lightfeed/extractor#readme",
"peerDependencies": {
"@langchain/core": ">=1.1.31"
},
"dependencies": {
"cheerio": "^1.0.0",
"jsdom": "^24.1.3",
"jsonrepair": "^3.12.0",
"turndown": "^7.2.0",
"zod": "^3.24.3"
},
"devDependencies": {
"@langchain/core": "^1.1.31",
"@langchain/google-genai": "^2.1.24",
"@langchain/openai": "^1.2.12",
"@types/jest": "^29.5.12",
"@types/node": "^22.15.3",
"@types/turndown": "^5.0.5",
"dotenv": "^16.3.1",
"jest": "^29.7.0",
"playwright": "^1.58.2",
"rimraf": "^5.0.10",
"ts-jest": "^29.1.2",
"ts-node": "^10.9.2",
"typescript": "^5.8.3"
},
"publishConfig": {
"access": "public"
}
}