Skip to content

Commit 3ff2f07

Browse files
committed
Added OpenSourceAI and conversational support in the extension
1 parent c20f517 commit 3ff2f07

File tree

10 files changed

+410
-34
lines changed

10 files changed

+410
-34
lines changed

pgml-extension/src/api.rs

Lines changed: 83 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -632,6 +632,37 @@ pub fn transform_string(
632632
}
633633
}
634634

635+
#[cfg(all(feature = "python", not(feature = "use_as_lib")))]
636+
#[pg_extern(immutable, parallel_safe, name = "transform")]
637+
#[allow(unused_variables)] // cache is maintained for api compatibility
638+
pub fn transform_conversational_json(
639+
task: JsonB,
640+
args: default!(JsonB, "'{}'"),
641+
inputs: default!(Vec<JsonB>, "ARRAY[]::JSONB[]"),
642+
cache: default!(bool, false),
643+
) -> JsonB {
644+
match crate::bindings::transformers::transform(&task.0, &args.0, inputs) {
645+
Ok(output) => JsonB(output),
646+
Err(e) => error!("{e}"),
647+
}
648+
}
649+
650+
#[cfg(all(feature = "python", not(feature = "use_as_lib")))]
651+
#[pg_extern(immutable, parallel_safe, name = "transform")]
652+
#[allow(unused_variables)] // cache is maintained for api compatibility
653+
pub fn transform_conversational_string(
654+
task: String,
655+
args: default!(JsonB, "'{}'"),
656+
inputs: default!(Vec<JsonB>, "ARRAY[]::JSONB[]"),
657+
cache: default!(bool, false),
658+
) -> JsonB {
659+
let task_json = json!({ "task": task });
660+
match crate::bindings::transformers::transform(&task_json, &args.0, inputs) {
661+
Ok(output) => JsonB(output),
662+
Err(e) => error!("{e}"),
663+
}
664+
}
665+
635666
#[cfg(all(feature = "python", not(feature = "use_as_lib")))]
636667
#[pg_extern(immutable, parallel_safe, name = "transform_stream")]
637668
#[allow(unused_variables)] // cache is maintained for api compatibility
@@ -642,10 +673,13 @@ pub fn transform_stream_json(
642673
cache: default!(bool, false),
643674
) -> SetOfIterator<'static, String> {
644675
// We can unwrap this because if there is an error the current transaction is aborted in the map_err call
645-
let python_iter =
646-
crate::bindings::transformers::transform_stream_iterator(&task.0, &args.0, input)
647-
.map_err(|e| error!("{e}"))
648-
.unwrap();
676+
let python_iter = crate::bindings::transformers::transform_stream_iterator(
677+
&task.0,
678+
&args.0,
679+
input.to_string(),
680+
)
681+
.map_err(|e| error!("{e}"))
682+
.unwrap();
649683
SetOfIterator::new(python_iter)
650684
}
651685

@@ -667,6 +701,51 @@ pub fn transform_stream_string(
667701
SetOfIterator::new(python_iter)
668702
}
669703

704+
#[cfg(all(feature = "python", not(feature = "use_as_lib")))]
705+
#[pg_extern(immutable, parallel_safe, name = "transform_stream")]
706+
#[allow(unused_variables)] // cache is maintained for api compatibility
707+
pub fn transform_stream_conversational_json(
708+
task: JsonB,
709+
args: default!(JsonB, "'{}'"),
710+
input: default!(JsonB, "'[]'::JSONB"),
711+
cache: default!(bool, false),
712+
) -> SetOfIterator<'static, String> {
713+
// If they have Vec<JsonB> inputs let's make sure they have the right task
714+
if !task.0["task"]
715+
.as_str()
716+
.is_some_and(|v| v == "conversational")
717+
{
718+
error!("ARRAY[]::JSONB inputs for transformer_stream should only be used with a conversational task");
719+
}
720+
// We can unwrap this because if there is an error the current transaction is aborted in the map_err call
721+
let python_iter =
722+
crate::bindings::transformers::transform_stream_iterator(&task.0, &args.0, input.0)
723+
.map_err(|e| error!("{e}"))
724+
.unwrap();
725+
SetOfIterator::new(python_iter)
726+
}
727+
728+
#[cfg(all(feature = "python", not(feature = "use_as_lib")))]
729+
#[pg_extern(immutable, parallel_safe, name = "transform_stream")]
730+
#[allow(unused_variables)] // cache is maintained for api compatibility
731+
pub fn transform_stream_conversational_string(
732+
task: String,
733+
args: default!(JsonB, "'{}'"),
734+
input: default!(JsonB, "'[]'::JSONB"),
735+
cache: default!(bool, false),
736+
) -> SetOfIterator<'static, String> {
737+
if task != "conversational" {
738+
error!("ARRAY[]::JSONB inputs for transformer_stream should only be used with a conversational task");
739+
}
740+
let task_json = json!({ "task": task });
741+
// We can unwrap this because if there is an error the current transaction is aborted in the map_err call
742+
let python_iter =
743+
crate::bindings::transformers::transform_stream_iterator(&task_json, &args.0, input.0)
744+
.map_err(|e| error!("{e}"))
745+
.unwrap();
746+
SetOfIterator::new(python_iter)
747+
}
748+
670749
#[cfg(feature = "python")]
671750
#[pg_extern(immutable, parallel_safe, name = "generate")]
672751
fn generate(project_name: &str, inputs: &str, config: default!(JsonB, "'{}'")) -> String {

pgml-extension/src/bindings/transformers/transform.rs

Lines changed: 9 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@ use anyhow::Result;
44
use pgrx::*;
55
use pyo3::prelude::*;
66
use pyo3::types::{IntoPyDict, PyDict, PyTuple};
7+
use pyo3::AsPyPointer;
78

89
create_pymodule!("/src/bindings/transformers/transformers.py");
910

@@ -41,10 +42,10 @@ impl Iterator for TransformStreamIterator {
4142
}
4243
}
4344

44-
pub fn transform(
45+
pub fn transform<T: serde::Serialize>(
4546
task: &serde_json::Value,
4647
args: &serde_json::Value,
47-
inputs: Vec<&str>,
48+
inputs: T,
4849
) -> Result<serde_json::Value> {
4950
crate::bindings::python::activate()?;
5051
whitelist::verify_task(task)?;
@@ -74,17 +75,17 @@ pub fn transform(
7475
Ok(serde_json::from_str(&results)?)
7576
}
7677

77-
pub fn transform_stream(
78+
pub fn transform_stream<T: serde::Serialize>(
7879
task: &serde_json::Value,
7980
args: &serde_json::Value,
80-
input: &str,
81+
input: T,
8182
) -> Result<Py<PyAny>> {
8283
crate::bindings::python::activate()?;
8384
whitelist::verify_task(task)?;
8485

8586
let task = serde_json::to_string(task)?;
8687
let args = serde_json::to_string(args)?;
87-
let inputs = serde_json::to_string(&vec![input])?;
88+
let input = serde_json::to_string(&input)?;
8889

8990
Python::with_gil(|py| -> Result<Py<PyAny>> {
9091
let transform: Py<PyAny> = get_module!(PY_MODULE)
@@ -99,7 +100,7 @@ pub fn transform_stream(
99100
&[
100101
task.into_py(py),
101102
args.into_py(py),
102-
inputs.into_py(py),
103+
input.into_py(py),
103104
true.into_py(py),
104105
],
105106
),
@@ -110,10 +111,10 @@ pub fn transform_stream(
110111
})
111112
}
112113

113-
pub fn transform_stream_iterator(
114+
pub fn transform_stream_iterator<T: serde::Serialize>(
114115
task: &serde_json::Value,
115116
args: &serde_json::Value,
116-
input: &str,
117+
input: T,
117118
) -> Result<TransformStreamIterator> {
118119
let python_iter = transform_stream(task, args, input)
119120
.map_err(|e| error!("{e}"))

pgml-extension/src/bindings/transformers/transformers.py

Lines changed: 24 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -41,6 +41,7 @@
4141
TrainingArguments,
4242
Trainer,
4343
TextStreamer,
44+
Conversation
4445
)
4546
from threading import Thread
4647
from typing import Optional
@@ -198,8 +199,8 @@ def __init__(self, model_name, **task):
198199
self.task = "text-generation"
199200

200201
def stream(self, inputs, **kwargs):
201-
output = self.model(inputs[0], stream=True, **kwargs)
202-
return ThreadedGeneratorIterator(output, inputs[0])
202+
output = self.model(inputs, stream=True, **kwargs)
203+
return ThreadedGeneratorIterator(output, inputs)
203204

204205
def __call__(self, inputs, **kwargs):
205206
outputs = []
@@ -224,6 +225,7 @@ def __init__(self, model_name, **kwargs):
224225
"summarization",
225226
"translation",
226227
"text-generation",
228+
"conversational"
227229
]
228230
):
229231
self.task = kwargs.pop("task")
@@ -238,7 +240,7 @@ def __init__(self, model_name, **kwargs):
238240
)
239241
elif self.task == "summarization" or self.task == "translation":
240242
self.model = AutoModelForSeq2SeqLM.from_pretrained(model_name, **kwargs)
241-
elif self.task == "text-generation":
243+
elif self.task == "text-generation" or self.task == "conversational":
242244
self.model = AutoModelForCausalLM.from_pretrained(model_name, **kwargs)
243245
else:
244246
raise PgMLException(f"Unhandled task: {self.task}")
@@ -266,15 +268,30 @@ def __init__(self, model_name, **kwargs):
266268
self.tokenizer = self.pipe.tokenizer
267269

268270
def stream(self, inputs, **kwargs):
269-
streamer = TextIteratorStreamer(self.tokenizer)
270-
inputs = self.tokenizer(inputs, return_tensors="pt").to(self.model.device)
271-
generation_kwargs = dict(inputs, streamer=streamer, **kwargs)
271+
streamer = None
272+
generation_kwargs = None
273+
if self.task == "conversational":
274+
streamer = TextIteratorStreamer(self.tokenizer, skip_prompt=True)
275+
inputs = tokenized_chat = self.tokenizer.apply_chat_template(inputs, tokenize=True, add_generation_prompt=True, return_tensors="pt").to(self.model.device)
276+
generation_kwargs = dict(inputs=inputs, streamer=streamer, **kwargs)
277+
else:
278+
streamer = TextIteratorStreamer(self.tokenizer)
279+
inputs = self.tokenizer([inputs], return_tensors="pt").to(self.model.device)
280+
generation_kwargs = dict(inputs, streamer=streamer, **kwargs)
272281
thread = Thread(target=self.model.generate, kwargs=generation_kwargs)
273282
thread.start()
274283
return streamer
275284

276285
def __call__(self, inputs, **kwargs):
277-
return self.pipe(inputs, **kwargs)
286+
if self.task == "conversational":
287+
outputs = []
288+
for conversation in inputs:
289+
conversation = Conversation(conversation)
290+
conversation = self.pipe(conversation, **kwargs)
291+
outputs.append(conversation.generated_responses[-1])
292+
return outputs
293+
else:
294+
return self.pipe(inputs, **kwargs)
278295

279296

280297
def get_model_from(task):

pgml-sdks/pgml/build.rs

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ const ADDITIONAL_DEFAULTS_FOR_JAVASCRIPT: &[u8] = br#"
1414
export function init_logger(level?: string, format?: string): void;
1515
export function migrate(): Promise<void>;
1616
17-
export type Json = { [key: string]: any };
17+
export type Json = any;
1818
export type DateTime = Date;
1919
2020
export function newCollection(name: string, database_url?: string): Collection;
@@ -23,6 +23,7 @@ export function newSplitter(name?: string, parameters?: Json): Splitter;
2323
export function newBuiltins(database_url?: string): Builtins;
2424
export function newPipeline(name: string, model?: Model, splitter?: Splitter, parameters?: Json): Pipeline;
2525
export function newTransformerPipeline(task: string, model?: string, args?: Json, database_url?: string): TransformerPipeline;
26+
export function newOpenSourceAI(database_url?: string): OpenSourceAI;
2627
"#;
2728

2829
fn main() {

pgml-sdks/pgml/javascript/tests/typescript-tests/test.ts

Lines changed: 23 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -299,7 +299,29 @@ it("can transformer pipeline stream", async () => {
299299
output.push(result.value);
300300
result = await it.next();
301301
}
302-
expect(output.length).toBeGreaterThan(0)
302+
expect(output.length).toBeGreaterThan(0);
303+
});
304+
305+
///////////////////////////////////////////////////
306+
// Test OpenSourceAI //////////////////////////////
307+
///////////////////////////////////////////////////
308+
309+
it("can open source ai create", async () => {
310+
const client = pgml.newOpenSourceAI();
311+
const results = client.chat_completions_create(
312+
"mistralai/Mistral-7B-v0.1",
313+
[
314+
{
315+
role: "system",
316+
content: "You are a friendly chatbot who always responds in the style of a pirate",
317+
},
318+
{
319+
role: "user",
320+
content: "How many helicopters can a human eat in one sitting?",
321+
},
322+
],
323+
);
324+
expect(results.choices.length).toBeGreaterThan(0);
303325
});
304326

305327
///////////////////////////////////////////////////

pgml-sdks/pgml/python/tests/test.py

Lines changed: 27 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -307,7 +307,8 @@ async def test_order_documents():
307307
async def test_transformer_pipeline():
308308
t = pgml.TransformerPipeline("text-generation")
309309
it = await t.transform(["AI is going to"], {"max_new_tokens": 5})
310-
assert (len(it)) > 0
310+
assert len(it) > 0
311+
311312

312313
@pytest.mark.asyncio
313314
async def test_transformer_pipeline_stream():
@@ -316,7 +317,31 @@ async def test_transformer_pipeline_stream():
316317
total = []
317318
async for c in it:
318319
total.append(c)
319-
assert (len(total)) > 0
320+
assert len(total) > 0
321+
322+
323+
###################################################
324+
## Transformer Pipeline Tests #####################
325+
###################################################
326+
327+
328+
def test_open_source_ai_create():
329+
client = pgml.OpenSourceAI()
330+
results = client.chat_completions_create(
331+
"mistralai/Mistral-7B-v0.1",
332+
[
333+
{
334+
"role": "system",
335+
"content": "You are a friendly chatbot who always responds in the style of a pirate",
336+
},
337+
{
338+
"role": "user",
339+
"content": "How many helicopters can a human eat in one sitting?",
340+
},
341+
],
342+
temperature=0.85
343+
)
344+
assert len(results["choices"]) > 0
320345

321346

322347
###################################################

pgml-sdks/pgml/src/lib.rs

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,7 @@ mod languages;
1919
pub mod migrations;
2020
mod model;
2121
pub mod models;
22+
mod open_source_ai;
2223
mod order_by_builder;
2324
mod pipeline;
2425
mod queries;
@@ -34,6 +35,7 @@ mod utils;
3435
pub use builtins::Builtins;
3536
pub use collection::Collection;
3637
pub use model::Model;
38+
pub use open_source_ai::OpenSourceAI;
3739
pub use pipeline::Pipeline;
3840
pub use splitter::Splitter;
3941
pub use transformer_pipeline::TransformerPipeline;
@@ -152,6 +154,7 @@ fn pgml(_py: pyo3::Python, m: &pyo3::types::PyModule) -> pyo3::PyResult<()> {
152154
m.add_class::<splitter::SplitterPython>()?;
153155
m.add_class::<builtins::BuiltinsPython>()?;
154156
m.add_class::<transformer_pipeline::TransformerPipelinePython>()?;
157+
m.add_class::<open_source_ai::OpenSourceAIPython>()?;
155158
Ok(())
156159
}
157160

@@ -201,6 +204,10 @@ fn main(mut cx: neon::context::ModuleContext) -> neon::result::NeonResult<()> {
201204
transformer_pipeline::TransformerPipelineJavascript::new,
202205
)?;
203206
cx.export_function("newPipeline", pipeline::PipelineJavascript::new)?;
207+
cx.export_function(
208+
"newOpenSourceAI",
209+
open_source_ai::OpenSourceAIJavascript::new,
210+
)?;
204211
Ok(())
205212
}
206213

0 commit comments

Comments
 (0)