Add docs for C and C++ to the website (#183)
VivekPanyam authored Oct 27, 2023
1 parent bc46639 commit 60afa98
Showing 6 changed files with 282 additions and 3 deletions.
2 changes: 2 additions & 0 deletions docs/website/components/code.tsx
@@ -62,6 +62,8 @@ const LANGUAGE_TAGS = {
"rust": {"bg": "bg-violet-500", tag: "rust"},
"json": { "bg": "bg-orange-500", tag: "json" },
"toml": { "bg": "bg-orange-500", tag: "toml" },
"c": { "bg": "bg-lime-500", tag: "c" },
"cpp": { "bg": "bg-cyan-500", tag: "c++" },
}

const Code = ({
4 changes: 2 additions & 2 deletions docs/website/components/languageselect.tsx
@@ -22,8 +22,8 @@ export const LANGUAGES = [
{ name: "JavaScript", enabled: true },
{ name: "TypeScript", enabled: true },
{ name: "Rust", enabled: true },
- { name: "C", enabled: false },
- { name: "C++", enabled: false },
+ { name: "C", enabled: true },
+ { name: "C++", enabled: true },
{ name: "C#", enabled: false },
{ name: "Java", enabled: false },
{ name: "Golang", enabled: false },
178 changes: 178 additions & 0 deletions docs/website/pages/docs/loading.mdx
@@ -212,6 +212,184 @@ Carton::load(
},
)
```
</LanguageItem>
<LanguageItem forLang='c'>

# Loading a model

<div className="flex items-center space-x-3 not-prose">
<p>Select a programming language:</p>
<LanguageSelect/>
</div>

Once you have a packed model, you can load it with a file path or URL. There are two ways to load a model from C. The first uses callbacks:

```c forLang='c'
#include <unistd.h> // for sleep()

#include "carton.h"

void load_callback(Carton *model, CartonStatus status, void *callback_arg);

int main()
{
    int load_callback_arg = 123;
    carton_load("https://carton.pub/google-research/bert-base-uncased", load_callback, (void *)load_callback_arg);

    // Make sure the program doesn't end before the async task completes
    sleep(60);
}
```
This approach can be useful for integrating with existing async/event systems like [libevent](https://libevent.org/) or [libuv](https://libuv.org/).

One of the caveats is that these callbacks are executed from within opaque Carton-owned threads. As a general rule, it's important to avoid doing blocking I/O or extended periods of CPU-bound work within these callbacks. Doing so could block other tasks within Carton's internal async runtime from executing.

To help ease these restrictions, we provide another approach with `CartonAsyncNotifier`. This lets users wait for or poll for new callbacks on a thread they control, removing the above restrictions and making basic C integrations simpler:
```c forLang='c'
#include <assert.h> // for assert()

#include "carton.h"

int main()
{
    // Create an async notifier
    CartonAsyncNotifier *notifier;
    carton_async_notifier_create(&notifier);

    // Load the model
    Carton *model;
    CartonNotifierCallback callback;
    void *callback_arg = (void *)23;
    carton_async_notifier_register(notifier, &callback, &callback_arg);
    carton_load("https://carton.pub/google-research/bert-base-uncased", (CartonLoadCallback)callback, callback_arg);

    // Wait for the model to load
    void *notifier_callback_arg_out;
    CartonStatus status;
    carton_async_notifier_wait(notifier, (void **)&model, &status, &notifier_callback_arg_out);
    assert(notifier_callback_arg_out == (void *)23);

    // ...
}
```
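The notifier pattern itself is independent of Carton. As a rough sketch of what it looks like under the hood, here is a minimal, hypothetical version in plain C using pthreads: a mutex and condition variable guard a result slot, the library-owned thread publishes into it, and the user's thread blocks until something is ready. All of the names here (`Notifier`, `notifier_wait`, etc.) are illustrative and are not part of Carton's API.

```c forLang='c'
#include <assert.h>
#include <pthread.h>
#include <stdint.h>

// A minimal one-slot notifier: a mutex + condition variable guarding a result.
typedef struct
{
    pthread_mutex_t mu;
    pthread_cond_t cv;
    int ready;
    void *result;
} Notifier;

void notifier_init(Notifier *n)
{
    pthread_mutex_init(&n->mu, NULL);
    pthread_cond_init(&n->cv, NULL);
    n->ready = 0;
    n->result = NULL;
}

// Called from the "runtime" thread: publish a result and wake the waiter.
void notifier_notify(Notifier *n, void *result)
{
    pthread_mutex_lock(&n->mu);
    n->result = result;
    n->ready = 1;
    pthread_cond_signal(&n->cv);
    pthread_mutex_unlock(&n->mu);
}

// Called from the user's thread: block until a result is published.
void *notifier_wait(Notifier *n)
{
    pthread_mutex_lock(&n->mu);
    while (!n->ready)
        pthread_cond_wait(&n->cv, &n->mu);
    void *result = n->result;
    pthread_mutex_unlock(&n->mu);
    return result;
}

// Stand-in for an async load completing on a library-owned thread.
void *fake_async_load(void *arg)
{
    Notifier *n = (Notifier *)arg;
    notifier_notify(n, (void *)(intptr_t)123);
    return NULL;
}
```

Because the waiting happens on a thread the user controls, expensive work after `notifier_wait` returns doesn't stall the runtime's threads.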

With both approaches, Carton loads the model (caching it locally if necessary).

Callbacks and notifications are available for every async function in Carton's interface.

For complete, runnable examples of loading and running a model from C, take a look at this [callback example](https://github.com/VivekPanyam/carton/blob/main/source/carton-bindings-c/tests/basic.c) or this [notifier example](https://github.com/VivekPanyam/carton/blob/main/source/carton-bindings-c/tests/notifier.c).

For more info on async functions in the Carton C interface, see [here](https://github.com/VivekPanyam/carton/blob/main/source/carton-bindings-c/README.md).

If you don't yet have a packed model, take a look at the [packing docs](/docs/packing) or explore the [community model registry](https://carton.pub).


</LanguageItem>
<LanguageItem forLang='c++'>

# Loading a model

<div className="flex items-center space-x-3 not-prose">
<p>Select a programming language:</p>
<LanguageSelect/>
</div>

Once you have a packed model, you can load it with a file path or URL. There are three ways to load a model from C++. The first uses futures:

```cpp forLang='c++'
#include <cstdint>
#include <iostream>
#include <string>
#include <unordered_map>

#include "carton.hh"

int main()
{
    // Load a model, wait for the future to complete, unwrap the result
    auto model = carton::Carton::load("https://carton.pub/google-research/bert-base-uncased").get().get_or_throw();

    // Create an input tensor
    uint64_t shape[]{1};
    auto tensor = carton::Tensor(carton::DataType::kString, shape);
    tensor.set_string(0, "Today is a good [MASK].");

    // Create a map of inputs
    std::unordered_map<std::string, carton::Tensor> inputs;
    inputs.insert(std::make_pair("input", std::move(tensor)));

    // Run inference, wait for the future to complete, unwrap the result
    auto out = model.infer(std::move(inputs)).get().get_or_throw();

    // Get the output tensors
    const auto tokens = out.get_and_remove("tokens");
    const auto scores = out.get_and_remove("scores");

    const auto scores_data = static_cast<const float *>(scores.data());

    std::cout << "Got output token: " << tokens.get_string(0) << std::endl;
    std::cout << "Got output scores: " << scores_data[0] << std::endl;
}
```

In the above example, `load` and `infer` both return `std::future`s.

The second approach uses callbacks:

```cpp forLang='c++'
#include <unistd.h> // for sleep()

#include "carton.hh"

void load_callback(carton::Result<carton::Carton> model_result, void *arg);

int main()
{
    // Load a model
    int load_callback_arg = 42;
    carton::Carton::load(
        "https://carton.pub/google-research/bert-base-uncased",
        load_callback,
        (void *)load_callback_arg);

    // Make sure the program doesn't end before the async task completes
    sleep(60);
}
```

This approach can be useful for integrating with existing async/event systems like [libevent](https://libevent.org/) or [libuv](https://libuv.org/).

One of the caveats is that these callbacks are executed from within opaque Carton-owned threads. As a general rule, it's important to avoid doing blocking I/O or extended periods of CPU-bound work within these callbacks. Doing so could block other tasks within Carton's internal async runtime from executing.

To help ease these restrictions, we provide a third approach with `carton::AsyncNotifier`. This lets users wait for or poll for new callbacks on a thread they control, removing the above restrictions. It also makes waiting on several futures more efficient because you get notified when one is ready instead of having to poll all of them.

```cpp forLang='c++'
#include <cassert> // for assert()

#include "carton.hh"

int main()
{
    // Create an async notifier
    carton::AsyncNotifier<carton::Carton> load_notifier;

    // Load a model
    carton::Carton::load(
        "https://carton.pub/google-research/bert-base-uncased",
        load_notifier.handle(),
        (void *)42);

    // Wait for the model to load
    auto [model_result, arg] = load_notifier.wait();
    assert(arg == (void *)42);
    auto model = model_result.get_or_throw();

    // ...
}
```
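The efficiency argument above comes from the notifier waking the consumer as soon as *any* result is ready, instead of the consumer polling each future in turn. A minimal, hypothetical sketch of that idea using only the standard library (the `ToyNotifier` class below is illustrative and is not Carton's actual API):

```cpp forLang='c++'
#include <cassert>
#include <condition_variable>
#include <mutex>
#include <queue>
#include <thread>

// A toy notifier: completed results are pushed onto a queue and the
// consumer is woken as soon as any one of them becomes available.
template <typename T>
class ToyNotifier
{
public:
    // Called by producer threads when a result completes.
    void notify(T value)
    {
        {
            std::lock_guard<std::mutex> lock(mu_);
            ready_.push(std::move(value));
        }
        cv_.notify_one();
    }

    // Blocks until some result (not a specific one) is available.
    T wait()
    {
        std::unique_lock<std::mutex> lock(mu_);
        cv_.wait(lock, [&] { return !ready_.empty(); });
        T value = std::move(ready_.front());
        ready_.pop();
        return value;
    }

private:
    std::mutex mu_;
    std::condition_variable cv_;
    std::queue<T> ready_;
};
```

With several operations in flight, each call to `wait()` returns whichever one finished first, so the consumer never busy-polls a set of futures.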

With all three approaches, Carton loads the model (caching it locally if necessary).

Futures, callbacks and notifications are available for every async function in Carton's interface.

For complete, runnable examples of loading and running a model from C++, take a look at this [callback example](https://github.com/VivekPanyam/carton/blob/main/source/carton-bindings-cpp/tests/callback.cc), this [future example](https://github.com/VivekPanyam/carton/blob/main/source/carton-bindings-cpp/tests/future.cc) or this [notifier example](https://github.com/VivekPanyam/carton/blob/main/source/carton-bindings-cpp/tests/notifier.cc).

For more info on async functions in the Carton C++ interface, see [here](https://github.com/VivekPanyam/carton/blob/main/source/carton-bindings-cpp/README.md).

If you don't yet have a packed model, take a look at the [packing docs](/docs/packing) or explore the [community model registry](https://carton.pub).


</LanguageItem>
<LanguageItem>

15 changes: 15 additions & 0 deletions docs/website/pages/docs/metadata.mdx
@@ -1,5 +1,8 @@
import LanguageSelect, {LanguageSwitch, LanguageItem} from "@/components/languageselect";

<LanguageSwitch>
<LanguageItem forLang='python,rust,javascript,typescript'>

# Model Metadata

It's possible to fetch model metadata without loading a model. This approach only fetches the data needed to provide the requested information and is therefore quite efficient even with large models.
@@ -311,5 +314,17 @@ console.log(info.manifest_sha256)
</LanguageItem>
</LanguageSwitch>


</LanguageItem>
<LanguageItem>

This language currently does not support fetching model metadata. Please check the [quickstart guide](/quickstart) for more info or select a different language.

<div className="flex not-prose">
<LanguageSelect/>
</div>
</LanguageItem>
</LanguageSwitch>

import DocsLayout from '@/components/docslayout'
export default ({children}) => <DocsLayout>{children}</DocsLayout>
2 changes: 1 addition & 1 deletion docs/website/pages/index.tsx
@@ -134,7 +134,7 @@ export default function Home() {
// Display each language twice
[1, 2].flatMap((idx) => LANGUAGES.map((lang) => <span key={`${lang}-${idx}`} className={`${roboto_mono.className} select-none uppercase px-20 text-slate-500`}>
{lang}
-{["python", "rust"].indexOf(lang.toLowerCase()) == -1 && <span className='text-sky-400'>*</span>}
+{["python", "rust", "c", "c++"].indexOf(lang.toLowerCase()) == -1 && <span className='text-sky-400'>*</span>}
</span>))
}
</div>
84 changes: 84 additions & 0 deletions docs/website/pages/quickstart.mdx
@@ -8,6 +8,88 @@ import LanguageSelect, {LanguageSwitch, LanguageItem} from "@/components/languag
<LanguageSelect/>
</div>

<LanguageSwitch>
<LanguageItem forLang='c,c++'>

```bash linePrompt='$' forLang='c'
# Pick the appropriate file for your OS and arch
wget https://nightly-assets.carton.run/bindings/carton_c_aarch64-apple-darwin.tar.gz
wget https://nightly-assets.carton.run/bindings/carton_c_aarch64-unknown-linux-gnu.tar.gz
wget https://nightly-assets.carton.run/bindings/carton_c_x86_64-apple-darwin.tar.gz
wget https://nightly-assets.carton.run/bindings/carton_c_x86_64-unknown-linux-gnu.tar.gz
```

```bash linePrompt='$' forLang='c++'
# Pick the appropriate file for your OS and arch
wget https://nightly-assets.carton.run/bindings/carton_cpp_aarch64-apple-darwin.tar.gz
wget https://nightly-assets.carton.run/bindings/carton_cpp_aarch64-unknown-linux-gnu.tar.gz
wget https://nightly-assets.carton.run/bindings/carton_cpp_x86_64-apple-darwin.tar.gz
wget https://nightly-assets.carton.run/bindings/carton_cpp_x86_64-unknown-linux-gnu.tar.gz
```

&nbsp;
# Load and run a model

If you want to run an existing carton model (or "a carton" for short), you can just pass in a file path or URL.

```c forLang='c'
#include <unistd.h> // for sleep()

#include "carton.h"

void load_callback(Carton *model, CartonStatus status, void *callback_arg)
{
    // ...
}

int main()
{
    int load_callback_arg = 123;
    carton_load("https://carton.pub/google-research/bert-base-uncased", load_callback, (void *)load_callback_arg);

    // Make sure the program doesn't end before the async task completes
    sleep(60);
}
```
```cpp forLang='c++'
#include <cstdint>
#include <iostream>
#include <string>
#include <unordered_map>

#include "carton.hh"

int main()
{
    // Load a model, wait for the future to complete, unwrap the result
    auto model = carton::Carton::load("https://carton.pub/google-research/bert-base-uncased").get().get_or_throw();

    // Create an input tensor
    uint64_t shape[]{1};
    auto tensor = carton::Tensor(carton::DataType::kString, shape);
    tensor.set_string(0, "Today is a good [MASK].");

    // Create a map of inputs
    std::unordered_map<std::string, carton::Tensor> inputs;
    inputs.insert(std::make_pair("input", std::move(tensor)));

    // Run inference, wait for the future to complete, unwrap the result
    auto out = model.infer(std::move(inputs)).get().get_or_throw();

    // Get the output tensors
    const auto tokens = out.get_and_remove("tokens");
    const auto scores = out.get_and_remove("scores");

    const auto scores_data = static_cast<const float *>(scores.data());

    std::cout << "Got output token: " << tokens.get_string(0) << std::endl;
    std::cout << "Got output scores: " << scores_data[0] << std::endl;
}
```

See the ["Loading a model"](/docs/loading) docs for complete examples of how to load a model and run inference.

At the moment, packing models and fetching metadata are not supported from C or C++.

</LanguageItem>
<LanguageItem>

```bash linePrompt='$' forLang='python'
pip install cartonml-nightly
```
@@ -296,6 +378,8 @@ async fn main() {

Carton routes all of its log messages to the console. If you want to see trace logging, you may need to enable the verbose log level in your browser's console.

</LanguageItem>
</LanguageSwitch>
</LanguageItem>
</LanguageSwitch>

