-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathinput_schema.json
78 lines (78 loc) · 4.26 KB
/
input_schema.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
{
"title": "OpenAI Vector Store Integration",
"type": "object",
"description": "Use Apify's dataset and update OpenAI Vector Store (for OpenAI Assistant V2)",
"schemaVersion": 1,
"properties": {
"vectorStoreId": {
"title": "Vector Store ID",
"type": "string",
"description": "Vector Store ID where the data will be stored",
"editor": "textfield"
},
"openaiApiKey": {
"title": "OpenAI API KEY",
"type": "string",
"description": "OpenAI API KEY",
"editor": "textfield",
"isSecret": true
},
"assistantId": {
"title": "Assistant ID",
"type": "string",
"description": "The ID of an OpenAI Assistant. This parameter is required only when a file exceeds the OpenAI size limit of 5,000,000 tokens (as of 2024-04-23).\n\n When necessary, the model associated with the assistant is utilized to count tokens and split the large file into smaller, manageable segments.",
"editor": "textfield"
},
"datasetFields": {
"title": "A list of dataset fields which should be selected from the dataset",
"type": "array",
"description": "A list of dataset fields which should be selected from the items, only these dataset fields will remain in the resulting record objects.\n\n For example, when using the website content crawler, you might select dataset fields such as `text` and `url`, and `metadata.title` among others, to be included in the vector store file.",
"default": [ "url", "text"],
"prefill": ["url", "text", "metadata.title"],
"editor": "json"
},
"filePrefix": {
"title": "Delete/Create vector store files with a prefix",
"type": "string",
"description": "Using a file prefix helps with the management of vector store file updates by eliminating the need to track each file's ID. For instance, if you set the filePrefix to 'apify-advisor', the Actor will initially locate all files in the vector store with this prefix. Subsequently, it will delete these files and create new ones, also prefixed accordingly.",
"editor": "textfield",
"minLength": 5
},
"fileIdsToDelete": {
"title": "Array of vector store file ids to delete",
"type": "array",
"description": "Delete specified file ids associated with vector store. This can be useful when one needs to delete files that are no longer needed.",
"editor": "json"
},
"saveCrawledFiles": {
"title": "Save crawled files (docs, pdf, pptx) to OpenAI File Store",
"type": "boolean",
"description": "Save files from Apify's key-value store to OpenAI's file store. Useful when utilizing Apify’s website content crawler with the 'saveFiles' option, allowing the found files to be directly stored.",
"default": true
},
"datasetId": {
"title": "Apify's Dataset ID",
"type": "string",
"description": "The Dataset ID is provided automatically when the actor is set up as an integration. You can fill it in explicitly here to enable debugging of the actor",
"editor": "textfield",
"sectionCaption": "Debugging options"
},
"keyValueStoreId": {
"title": "Apify's Key-value store ID (source for json, pdf, pptx files) ",
"type": "string",
"description": "This is the ID for the Key-value store on Apify, which serves as the data source for json, pdf, and pptx files. This ID is automatically provided when the actor is integrated. However, you can manually enter the ID here for debugging purposes.",
"editor": "textfield"
},
"saveInApifyKeyValueStore": {
"title": "Save all created files in the Apify's key-value store",
"type": "boolean",
"description": "Save all created files in the Apify's Key-Value Store to easily check and retrieve all files (this is typically used when debugging)",
"default": false
}
},
"required": [
"vectorStoreId",
"datasetFields",
"openaiApiKey"
]
}