NIFI-12646 Set Python Processor version to 2.0.0-M2

Signed-off-by: David Handermann <exceptionfactory@apache.org>
This commit is contained in:
exceptionfactory 2024-01-19 19:12:04 -06:00
parent 49702f1f51
commit 38fc0a4e8d
No known key found for this signature in database
GPG Key ID: 29B6A52D2AAE8DBA
8 changed files with 12 additions and 7 deletions

View File

@@ -30,7 +30,7 @@ class PromptChatGPT(FlowFileTransform):
implements = ['org.apache.nifi.python.processor.FlowFileTransform']
class ProcessorDetails:
version = '2.0.0-SNAPSHOT'
version = '2.0.0-M2'
description = "Submits a prompt to ChatGPT, writing the results either to a FlowFile attribute or to the contents of the FlowFile"
tags = ["text", "chatgpt", "gpt", "machine learning", "ML", "artificial intelligence", "ai", "document", "langchain"]
dependencies = ['langchain==0.0.331', 'openai==0.28.1', 'jsonpath-ng']

View File

@@ -104,7 +104,7 @@ class ChunkDocument(FlowFileTransform):
class Java:
implements = ['org.apache.nifi.python.processor.FlowFileTransform']
class ProcessorDetails:
version = '2.0.0-SNAPSHOT'
version = '2.0.0-M2'
description = """Chunks incoming documents that are formatted as JSON Lines into chunks that are appropriately sized for creating Text Embeddings.
The input is expected to be in "json-lines" format, with each line having a 'text' and a 'metadata' element.
Each line will then be split into one or more lines in the output."""

View File

@@ -45,7 +45,7 @@ class ParseDocument(FlowFileTransform):
implements = ["org.apache.nifi.python.processor.FlowFileTransform"]
class ProcessorDetails:
version = "2.0.0-SNAPSHOT"
version = "2.0.0-M2"
description = """Parses incoming unstructured text documents and performs optical character recognition (OCR) in order to extract text from PDF and image files.
The output is formatted as "json-lines" with two keys: 'text' and 'metadata'.
Note that use of this Processor may require significant storage space and RAM utilization due to third-party dependencies necessary for processing PDF and image files.

View File

@@ -26,7 +26,7 @@ class PutChroma(FlowFileTransform):
implements = ['org.apache.nifi.python.processor.FlowFileTransform']
class ProcessorDetails:
version = '2.0.0-SNAPSHOT'
version = '2.0.0-M2'
description = """Publishes JSON data to a Chroma VectorDB. The Incoming data must be in single JSON per Line format, each with two keys: 'text' and 'metadata'.
The text must be a string, while metadata must be a map with strings for values. Any additional fields will be ignored. If the collection name specified
does not exist, the Processor will automatically create the collection."""

View File

@@ -52,7 +52,7 @@ class PutPinecone(FlowFileTransform):
implements = ['org.apache.nifi.python.processor.FlowFileTransform']
class ProcessorDetails:
version = '2.0.0-SNAPSHOT'
version = '2.0.0-M2'
description = """Publishes JSON data to Pinecone. The Incoming data must be in single JSON per Line format, each with two keys: 'text' and 'metadata'.
The text must be a string, while metadata must be a map with strings for values. Any additional fields will be ignored."""
tags = ["pinecone", "vector", "vectordb", "vectorstore", "embeddings", "ai", "artificial intelligence", "ml", "machine learning", "text", "LLM"]

View File

@@ -27,7 +27,7 @@ class QueryChroma(FlowFileTransform):
implements = ['org.apache.nifi.python.processor.FlowFileTransform']
class ProcessorDetails:
version = '2.0.0-SNAPSHOT'
version = '2.0.0-M2'
description = "Queries a Chroma Vector Database in order to gather a specified number of documents that are most closely related to the given query."
tags = ["chroma", "vector", "vectordb", "embeddings", "enrich", "enrichment", "ai", "artificial intelligence", "ml", "machine learning", "text", "LLM"]

View File

@@ -27,7 +27,7 @@ class QueryPinecone(FlowFileTransform):
implements = ['org.apache.nifi.python.processor.FlowFileTransform']
class ProcessorDetails:
version = '2.0.0-SNAPSHOT'
version = '2.0.0-M2'
description = "Queries Pinecone in order to gather a specified number of documents that are most closely related to the given query."
tags = ["pinecone", "vector", "vectordb", "vectorstore", "embeddings", "ai", "artificial intelligence", "ml", "machine learning", "text", "LLM"]

View File

@@ -56,6 +56,11 @@ language governing permissions and limitations under the License. -->
<groupId>com.fasterxml.jackson.datatype</groupId>
<artifactId>jackson-datatype-jsr310</artifactId>
</dependency>
<dependency>
<groupId>javax.annotation</groupId>
<artifactId>javax.annotation-api</artifactId>
<version>1.3.2</version>
</dependency>
</dependencies>
<build>