", "image": "https://jxnl.github.io/instructor/assets/images/social/blog/posts/aisummit-2023.png", "date_modified": "2024-03-12T02:46:20+00:00", "authors": [{"name": "jxnl"}], "tags": ["prompt engineering", "python", "talks", "video"]}, {"id": "https://jxnl.github.io/instructor/blog/2024/03/05/zero-cost-abstractions/", "url": "https://jxnl.github.io/instructor/blog/2024/03/05/zero-cost-abstractions/", "title": "Why Instructor is the Best Library for Structured LLM Outputs", "content_html": "
Why Instructor is the Best Library for Structured LLM Outputs
\n
Large language models (LLMs) like GPTs are incredibly powerful, but working with their open-ended text outputs can be challenging. This is where the Instructor library shines - it allows you to easily map LLM outputs to structured data using Python type annotations.
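To make that concrete, here is a minimal sketch of the pattern (the model name and extracted fields are illustrative): define a Pydantic model and pass it as `response_model` to a patched OpenAI client.

```python
import instructor
from openai import OpenAI
from pydantic import BaseModel

# Patch the OpenAI client so create() accepts a response_model argument
client = instructor.patch(OpenAI())

class UserDetail(BaseModel):
    name: str
    age: int

user = client.chat.completions.create(
    model="gpt-3.5-turbo",
    response_model=UserDetail,  # the LLM output is validated into this type
    messages=[{"role": "user", "content": "Extract: Jason is 25 years old"}],
)
assert isinstance(user, UserDetail)
```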
Instructor makes working with language models easy, but they are still computationally expensive.
\n
\n
Today, we're diving into optimizing instructor code while maintaining the excellent DX offered by Pydantic models. We'll tackle the challenges of caching Pydantic models, typically incompatible with pickle, and explore solutions that use decorators like functools.cache. Then, we'll craft custom decorators with diskcache and redis to support persistent caching and distributed systems.
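As a taste of where we're headed, here is a minimal sketch of the simplest approach: caching the extraction call with `functools.cache` (the model and prompt are illustrative; the cached function's arguments must be hashable, which plain strings are).

```python
import functools

import instructor
from openai import OpenAI
from pydantic import BaseModel

client = instructor.patch(OpenAI())

class UserDetail(BaseModel):
    name: str
    age: int

@functools.cache  # in-process cache keyed on the (hashable) string argument
def extract(data: str) -> UserDetail:
    return client.chat.completions.create(
        model="gpt-3.5-turbo",
        response_model=UserDetail,
        messages=[{"role": "user", "content": data}],
    )

extract("Jason is 25 years old")  # hits the API
extract("Jason is 25 years old")  # served from the cache, no API call
```

The catch, which the persistent-caching sections address, is that `functools.cache` lives only in memory, and serializing Pydantic models for `diskcache` or `redis` needs extra care.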
Smarter Summaries w/ Finetuning GPT-3.5 and Chain of Density
\n
\n
Discover how to distil an iterative method like Chain of Density into a single finetuned model using Instructor
\n
\n
In this article, we'll guide you through implementing the original Chain of Density method using Instructor, then show how to distil a GPT-3.5 model to match GPT-4's iterative summarization capabilities. Using these methods, we were able to decrease latency by 20x, reduce costs by 50x, and maintain entity density.
\n
By the end, you'll have a GPT-3.5 model (fine-tuned using Instructor's tooling) capable of producing summaries that rival the effectiveness of Chain of Density [Adams et al. (2023)]. As always, all code is readily available in the examples/chain-of-density folder in our repo for your reference.
Ensuring the accuracy of information is crucial. This blog post explores how Pydantic's powerful and flexible validators can enhance data accuracy through citation verification.
\n
We'll start with using a simple substring check to verify citations. Then we'll use instructor itself to power an LLM to verify citations and align answers with the given citations. Finally, we'll explore how we can use these techniques to generate a dataset of accurate responses.
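A minimal sketch of that first step, assuming Pydantic v2 and that the source text is passed in via validation context (the field names and `text_chunk` key are illustrative):

```python
from pydantic import BaseModel, ValidationInfo, field_validator

class Fact(BaseModel):
    statement: str
    substring_quote: str

    @field_validator("substring_quote")
    @classmethod
    def quote_exists_in_source(cls, v: str, info: ValidationInfo) -> str:
        # Reject any citation that is not literally present in the source text
        context = (info.context or {}).get("text_chunk", "")
        if v not in context:
            raise ValueError(f"Citation {v!r} not found in the source text")
        return v
```

A quote passes only if it appears verbatim in the supplied `text_chunk`, which catches the most blatant hallucinated citations before an LLM-powered check is even needed.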
I just released a free course on Weights and Biases. It goes over the material from [tutorial](../../tutorials/1-introducti...
", "image": "https://jxnl.github.io/instructor/assets/images/social/blog/posts/course.png", "date_modified": "2024-03-12T02:46:20+00:00", "authors": [{"name": "jxnl"}], "tags": ["open source"]}, {"id": "https://jxnl.github.io/instructor/blog/2023/10/17/enhancing-python-functions-with-instructor-a-guide-to-fine-tuning-and-distillation/", "url": "https://jxnl.github.io/instructor/blog/2023/10/17/enhancing-python-functions-with-instructor-a-guide-to-fine-tuning-and-distillation/", "title": "Enhancing Python Functions with Instructor: A Guide to Fine-Tuning and Distillation", "content_html": "
Enhancing Python Functions with Instructor: A Guide to Fine-Tuning and Distillation
\n
Introduction
\n
Get ready to dive deep into the world of fine-tuning task-specific language models with Python functions. We'll explore how instructor.instructions streamlines this process, making the task you want to distil more efficient and powerful while preserving its original functionality and backwards compatibility.
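As a rough sketch of the idea (the `Instructions` API shown here is an assumption based on the examples/distillation pattern; check the repo for the exact names), you wrap a typed Python function and the decorator captures its inputs and outputs as fine-tuning data:

```python
import instructor
from pydantic import BaseModel

# Assumed API: an Instructions object that names the distillation task.
instructions = instructor.Instructions(name="three_digit_multiply")

class Multiply(BaseModel):
    a: int
    b: int
    result: int

@instructions.distil  # assumed decorator: logs inputs/outputs for fine-tuning
def fn(a: int, b: int) -> Multiply:
    # The original Python implementation keeps working unchanged;
    # the captured (args, result) pairs become training data.
    return Multiply(a=a, b=b, result=a * b)
```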
Latency is crucial, especially in eCommerce and newer chat applications like ChatGPT. Streaming is the solution that enables us to enhance the user experience without the need for faster response times.
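To see why generators matter here, consider a minimal sketch of streaming an OpenAI chat completion (the model and prompt are illustrative): the function yields text the moment each chunk arrives instead of blocking until the full response is ready.

```python
from openai import OpenAI

client = OpenAI()

def stream_completion(prompt: str):
    # stream=True returns chunks as they are generated
    stream = client.chat.completions.create(
        model="gpt-3.5-turbo",
        messages=[{"role": "user", "content": prompt}],
        stream=True,
    )
    for chunk in stream:
        delta = chunk.choices[0].delta.content
        if delta:
            yield delta  # hand each piece to the caller immediately

for token in stream_completion("Tell me a joke"):
    print(token, end="", flush=True)
```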
Language models have seen significant growth. Using them effectively often requires complex frameworks. This post discusses how Instructor simplifies this process using Pydantic.
It's a common misconception that LangChain's LangSmith is only compatible with LangChain's models. In reality, LangSmith is a unified DevOps platform for developing, collaborating on, testing, deploying, and monitoring LLM applications. In this blog we will explore how LangSmith can be used to enhance the OpenAI client alongside instructor.
", "image": "https://jxnl.github.io/instructor/assets/images/social/blog/posts/langsmith.png", "date_modified": "2024-03-12T02:46:20+00:00", "authors": [{"name": "jxnl"}], "tags": ["langsmith"]}, {"id": "https://jxnl.github.io/instructor/blog/2023/11/13/learn-async/", "url": "https://jxnl.github.io/instructor/blog/2023/11/13/learn-async/", "title": "Batch Processing OpenAI using asyncio and Instructor with Python", "content_html": "
Batch Processing OpenAI using asyncio and Instructor with Python
\n
Today, I will introduce you to various approaches for using asyncio in Python. We will apply this to batch process data using instructor and learn how to use asyncio.gather and asyncio.as_completed for concurrent data processing. Additionally, we will explore how to limit the number of concurrent requests to a server using asyncio.Semaphore.
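Putting those pieces together, here is a minimal sketch (the model, schema, and concurrency limit of 5 are illustrative, and it assumes `instructor.patch` accepts the async client):

```python
import asyncio

import instructor
from openai import AsyncOpenAI
from pydantic import BaseModel

client = instructor.patch(AsyncOpenAI())

class Person(BaseModel):
    name: str
    age: int

sem = asyncio.Semaphore(5)  # at most 5 requests in flight at once

async def extract(text: str) -> Person:
    async with sem:
        return await client.chat.completions.create(
            model="gpt-3.5-turbo",
            response_model=Person,
            messages=[{"role": "user", "content": text}],
        )

async def main(texts: list[str]) -> list[Person]:
    # gather schedules all extractions concurrently and preserves input order
    return await asyncio.gather(*(extract(t) for t in texts))

results = asyncio.run(main(["Jason is 25", "Sarah is 30"]))
```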
", "image": "https://jxnl.github.io/instructor/assets/images/social/blog/posts/learn-async.png", "date_modified": "2024-03-12T02:46:20+00:00", "authors": [{"name": "jxnl"}], "tags": ["async", "async/await", "asyncio", "batch", "python"]}, {"id": "https://jxnl.github.io/instructor/blog/2024/03/07/open-source-local-structured-output-pydantic-json-openai/", "url": "https://jxnl.github.io/instructor/blog/2024/03/07/open-source-local-structured-output-pydantic-json-openai/", "title": "Structured Output for Open Source and Local LLMS", "content_html": "
Structured Output for Open Source and Local LLMS
\n
Originally, Instructor facilitated API interactions solely via the OpenAI SDK, with an emphasis on function calling, incorporating Pydantic for structured data validation and serialization.
\n
As the year progressed, we expanded our toolkit by integrating JSON mode, thus enhancing our adaptability to vision models and open source models. This advancement now enables us to support an extensive range of models, from GPT and Mistral to virtually any model accessible through Ollama and Hugging Face, facilitated by llama-cpp-python. For more insights into leveraging JSON mode with various models, refer back to our detailed guide on Patching.
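For example, a local model served by Ollama can be patched in JSON mode through its OpenAI-compatible endpoint (a sketch; the base URL, placeholder API key, and model name are assumptions that depend on your local setup):

```python
import instructor
from openai import OpenAI
from pydantic import BaseModel

# Ollama exposes an OpenAI-compatible API; the key is a placeholder.
client = instructor.patch(
    OpenAI(base_url="http://localhost:11434/v1", api_key="ollama"),
    mode=instructor.Mode.JSON,  # request raw JSON instead of function calls
)

class Character(BaseModel):
    name: str
    age: int

resp = client.chat.completions.create(
    model="llama2",
    response_model=Character,
    messages=[{"role": "user", "content": "Tell me about Harry Potter"}],
)
```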
", "image": "https://jxnl.github.io/instructor/assets/images/social/blog/posts/open_source.png", "date_modified": "2024-03-12T02:46:20+00:00", "authors": [{"name": "jxnl"}], "tags": ["anyscale", "groq", "llama-cpp-python", "llms", "mistral", "ollama", "opensource", "together"]}, {"id": "https://jxnl.github.io/instructor/blog/2023/09/17/rag-is-more-than-just-embedding-search/", "url": "https://jxnl.github.io/instructor/blog/2023/09/17/rag-is-more-than-just-embedding-search/", "title": "RAG is more than just embedding search", "content_html": "
RAG is more than just embedding search
\n
With the advent of large language models (LLMs), retrieval augmented generation (RAG) has become a hot topic. However, throughout the past year of helping startups integrate LLMs into their stack, I've noticed that the pattern of taking user queries, embedding them, and directly searching a vector store is effectively demoware.
\n
!!! note \"What is RAG?\"
\n
Retrieval augmented generation (RAG) is a technique that uses an LLM to generate responses, but uses a search backend to augment the generation. In the past year, using text embeddings with vector databases has been the most popular approach I've seen socialized.\n
\n\n\n
So let's kick things off by examining what I like to call the 'Dumb' RAG Model: a basic setup that's more common than you'd think.
What if your validation logic could learn and adapt like a human, but operate at the speed of software? This is the future of validation and it's already here.
\n
\n
Validation is the backbone of reliable software. But traditional methods are static, rule-based, and can't adapt to new challenges. This post looks at how to bring dynamic, machine-learning-driven validation into your software stack using Python libraries like Pydantic and Instructor. We validate these outputs using a validation function that conforms to the structure below.
\n
```python
def validation_function(value):
    if condition(value):
        raise ValueError("Value is not valid")
    return mutation(value)
```
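One concrete instance of this shape is Instructor's `llm_validator`, which swaps the hand-written `condition` for a model-powered check (a sketch; the statement and field are illustrative, and the exact `llm_validator` signature may vary between versions):

```python
from typing import Annotated

from instructor import llm_validator
from pydantic import BaseModel, BeforeValidator

class QuestionAnswer(BaseModel):
    question: str
    answer: Annotated[
        str,
        # An LLM decides whether the value satisfies the rule,
        # raising a ValueError (with an explanation) when it doesn't.
        BeforeValidator(llm_validator("don't say objectionable things")),
    ]
```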
", "image": "https://jxnl.github.io/instructor/assets/images/social/blog/posts/validation-part1.png", "date_modified": "2024-03-12T02:46:20+00:00", "authors": [{"name": "jxnl"}, {"name": "ivanleomk"}], "tags": ["chain of thought", "citations", "constitutional ai", "guardrails", "pydantic", "validation"]}]}
\ No newline at end of file
diff --git a/feed_rss_created.xml b/feed_rss_created.xml
deleted file mode 100644
index e431e22d6..000000000
--- a/feed_rss_created.xml
+++ /dev/null
@@ -1 +0,0 @@
-InstructorA lightweight library for structured outputs with LLMs.https://jxnl.github.io/instructor/Jason Liuhttps://github.com/jxnl/instructor/enTue, 12 Mar 2024 02:47:04 -0000Tue, 12 Mar 2024 02:47:04 -00001440MkDocs RSS plugin - v1.12.1Simple Synthetic Data Generationjxnl<h1>Simple Synthetic Data Generation</h1><p>What that people have been using instructor for is to generate synthetic data rather than extracting data itself. We can ...</p>https://jxnl.github.io/instructor/blog/2024/03/08/simple-synthetic-data-generation/ Fri, 08 Mar 2024 00:00:00 +0000https://jxnl.github.io/instructor/blog/2024/03/08/simple-synthetic-data-generation/Structured Output for Open Source and Local LLMSjxnlanyscalegroqllama-cpp-pythonllmsmistralollamaopensourcetogether<h1>Structured Output for Open Source and Local LLMS</h1><p>Originally, Instructor facilitated API interactions solely via the OpenAI SDK, with an emphasis on function call by incorporating <a href="https://pydantic-docs.helpmanual.io/">Pydantic</a> for structured data validation and serialization. </p><p>As the year progressed, we expanded our toolkit by integrating <a href="../../concepts/patching.md#json-mode">JSON mode</a>, thus enhancing our adaptability to vision models and open source models. This advancement now enables us to support an extensive range of models, from <a href="https://openai.com/api/">GPT</a> and <a href="https://mistral.ai">Mistral</a> to virtually any model accessible through <a href="https://ollama.ai">Ollama</a> and <a href="https://huggingface.co/models">Hugging Face</a>, facilitated by <a href="../../hub/llama-cpp-python.md">llama-cpp-python</a>. For more insights into leveraging JSON mode with various models, refer back to our detailed guide on <a href="../../concepts/patching.md">Patching</a>.</p><p>If you want to check out a course on how to use Instructor with Pydantic, check out our course on <a href="https://www.wandb.courses/courses/steering-language-models">Steering language models towards structured outputs.</a>.</p>https://jxnl.github.io/instructor/blog/2024/03/07/open-source-local-structured-output-pydantic-json-openai/ Thu, 07 Mar 2024 00:00:00 +0000https://jxnl.github.io/instructor/blog/2024/03/07/open-source-local-structured-output-pydantic-json-openai/Why Instructor is the Best Library for Structured LLM Outputsjxnlllmspython<h1>Why Instructor is the Best Library for Structured LLM Outputs</h1><p>Large language models (LLMs) like GPTs are incredibly powerful, but working with their open-ended text outputs can be challenging. This is where the Instructor library shines - it allows you to easily map LLM outputs to structured data using Python type annotations.</p>https://jxnl.github.io/instructor/blog/2024/03/05/zero-cost-abstractions/ Tue, 05 Mar 2024 00:00:00 +0000https://jxnl.github.io/instructor/blog/2024/03/05/zero-cost-abstractions/Seamless Support with Langsmithjxnllangsmith<h1>Seamless Support with Langsmith</h1><p>Its a common misconception that LangChain's <a href="https://www.langchain.com/langsmith">LangSmith</a> is only compatible with LangChain's models. In reality, LangSmith is a unified DevOps platform for developing, collaborating, testing, deploying, and monitoring LLM applications. 
In this blog we will explore how LangSmith can be used to enhance the OpenAI client alongside <code>instructor</code>.</p>https://jxnl.github.io/instructor/blog/2024/02/18/seamless-support-with-langsmith/ Sun, 18 Feb 2024 00:00:00 +0000https://jxnl.github.io/instructor/blog/2024/02/18/seamless-support-with-langsmith/Free course on Weights and Biasesjxnlopen source<h1>Free course on Weights and Biases</h1><p>I just released a free course on wits and biases. It goes over the material from [tutorial](../../tutorials/1-introducti...</p>https://jxnl.github.io/instructor/blog/2024/02/14/weights-and-biases-course/ Wed, 14 Feb 2024 00:00:00 +0000https://jxnl.github.io/instructor/blog/2024/02/14/weights-and-biases-course/Introduction to Caching in Pythonjxnlcachingdiskcachefunctoolspythonredis<h1>Introduction to Caching in Python</h1><blockquote><p>Instructor makes working with language models easy, but they are still computationally expensive.</p></blockquote><p>Today, we're diving into optimizing instructor code while maintaining the excellent DX offered by <a href="https://docs.pydantic.dev/latest/">Pydantic</a> models. We'll tackle the challenges of caching Pydantic models, typically incompatible with <code>pickle</code>, and explore solutions that use <code>decorators</code> like <code>functools.cache</code>. Then, we'll craft custom decorators with <code>diskcache</code> and <code>redis</code> to support persistent caching and distributed systems.</p>https://jxnl.github.io/instructor/blog/2023/11/26/python-caching/ Sun, 26 Nov 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/11/26/python-caching/Generators and LLM Streamingjxnlanmolgeneratorspythonstreaming<h1>Generators and LLM Streaming</h1><p>Latency is crucial, especially in eCommerce and newer chat applications like ChatGPT. Streaming is the solution that enables us to enhance the user experience without the need for faster response times.</p><p>And what makes streaming possible? Generators!</p>https://jxnl.github.io/instructor/blog/2023/11/26/python-generators-and-llm-streaming/ Sun, 26 Nov 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/11/26/python-generators-and-llm-streaming/Verifying LLM Citations with Pydanticjxnlcitationsfinetuneinghallucinationpydanticvalidation<h1>Verifying LLM Citations with Pydantic</h1><p>Ensuring the accuracy of information is crucial. This blog post explores how Pydantic's powerful and flexible validators can enhance data accuracy through citation verification.</p><p>We'll start with using a simple substring check to verify citations. Then we'll use <code>instructor</code> itself to power an LLM to verify citations and align answers with the given citations. Finally, we'll explore how we can use these techniques to generate a dataset of accurate responses.</p>https://jxnl.github.io/instructor/blog/2023/11/18/validate-citations/ Sat, 18 Nov 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/11/18/validate-citations/Batch Processing OpenAI using asyncio and Instructor with Pythonjxnlasyncasync/awaitasynciobatchpython<h1>Batch Processing OpenAI using <code>asyncio</code> and <code>Instructor</code> with Python</h1><p>Today, I will introduce you to various approaches for using asyncio in Python. We will apply this to batch process data using <code>instructor</code> and learn how to use <code>asyncio.gather</code> and <code>asyncio.as_completed</code> for concurrent data processing. 
Additionally, we will explore how to limit the number of concurrent requests to a server using <code>asyncio.Semaphore</code>.</p>https://jxnl.github.io/instructor/blog/2023/11/13/learn-async/ Mon, 13 Nov 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/11/13/learn-async/Smarter Summaries w/ Finetuning GPT-3.5 and Chain of Densityivanleomkjxnlchain of densitydistillationfinetuneinggpt-3.5-turbopydanticvalidation<h1>Smarter Summaries w/ Finetuning GPT-3.5 and Chain of Density</h1><blockquote><p>Discover how to distil an iterative method like Chain Of Density into a single finetuned model using Instructor</p></blockquote><p>In this article, we'll guide you through implementing the original Chain of Density method using Instructor, then show how to distile a GPT 3.5 model to match GPT-4's iterative summarization capabilities. Using these methods were able to decrease latency by 20x, reduce costs by 50x and maintain entity density.</p><p>By the end you'll end up with a GPT 3.5 model, (fine-tuned using Instructor's great tooling), capable of producing summaries that rival the effectiveness of Chain of Density <a href="https://arxiv.org/abs/2309.04269">[Adams et al. (2023)]</a>. As always, all code is readily available in our <code>examples/chain-of-density</code> folder in our repo for your reference.</p>https://jxnl.github.io/instructor/blog/2023/11/05/chain-of-density/ Sun, 05 Nov 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/11/05/chain-of-density/AI Engineer Keynote: Pydantic is all you needjxnlprompt engineeringpythontalksvideo<h1>AI Engineer Keynote: Pydantic is all you need</h1><p><a href="https://www.youtube.com/watch?v=yj-wSRJwrrc"><img alt="Pydantic is all you need" src="https://img.youtube.com/vi/yj-wSRJwrrc/0.jpg"></a></p><p><a href="https://www.youtube.com/watch?v=yj-wSRJwrrc">Click here to watch the full talk</a></p>https://jxnl.github.io/instructor/blog/2023/11/02/ai-engineer-keynote-pydantic-is-all-you-need/ Thu, 02 Nov 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/11/02/ai-engineer-keynote-pydantic-is-all-you-need/Good LLM Validation is Just Good Validationjxnlivanleomkchain of thoughtcitationsconstitutional aiguardrailspydanticvalidation<h1>Good LLM Validation is Just Good Validation</h1><blockquote><p>What if your validation logic could learn and adapt like a human, but operate at the speed of software? This is the future of validation and it's already here.</p></blockquote><p>Validation is the backbone of reliable software. But traditional methods are static, rule-based, and can't adapt to new challenges. This post looks at how to bring dynamic, machine learning-driven validation into your software stack using Python libraries like <code>Pydantic</code> and <code>Instructor</code>. 
We validate these outputs using a validation function which conforms to the structure seen below.</p><p><code>pythondef validation_function(value): if condition(value): raise ValueError("Value is not valid") return mutation(value)</code></p>https://jxnl.github.io/instructor/blog/2023/10/23/good-llm-validation-is-just-good-validation/ Mon, 23 Oct 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/10/23/good-llm-validation-is-just-good-validation/Enhancing Python Functions with Instructor: A Guide to Fine-Tuning and Distillationjxnldistillationfinetuningfunction callingpython<h1>Enhancing Python Functions with Instructor: A Guide to Fine-Tuning and Distillation</h1><h2>Introduction</h2><p>Get ready to dive deep into the world of fine-tuning task specific language models with Python functions. We'll explore how the <code>instructor.instructions</code> streamlines this process, making the task you want to distil more efficient and powerful while preserving its original functionality and backwards compatibility.</p><p>If you want to see the full example checkout <a href="https://github.com/jxnl/instructor/tree/main/examples/distilations">examples/distillation</a></p>https://jxnl.github.io/instructor/blog/2023/10/17/enhancing-python-functions-with-instructor-a-guide-to-fine-tuning-and-distillation/ Tue, 17 Oct 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/10/17/enhancing-python-functions-with-instructor-a-guide-to-fine-tuning-and-distillation/RAG is more than just embedding searchjxnlEmbeddingsPersonal AssistantQuery UnderstandingRAGSearch Systems<h1>RAG is more than just embedding search</h1><p>With the advent of large language models (LLM), retrieval augmented generation (RAG) has become a hot topic. However throughout the past year of <a href="https://jxnl.co">helping startups</a> integrate LLMs into their stack I've noticed that the pattern of taking user queries, embedding them, and directly searching a vector store is effectively demoware.</p><p>!!! note "What is RAG?"</p><pre><code>Retrieval augmented generation (RAG) is a technique that uses an LLM to generate responses, but uses a search backend to augment the generation. In the past year using text embeddings with a vector databases has been the most popular approach I've seen being socialized.</code></pre><figure markdown> ![RAG](img/dumb_rag.png) <figcaption>Simple RAG that embedded the user query and makes a search.</figcaption></figure><p>So let's kick things off by examining what I like to call the 'Dumb' RAG Model—a basic setup that's more common than you'd think.</p>https://jxnl.github.io/instructor/blog/2023/09/17/rag-is-more-than-just-embedding-search/ Sun, 17 Sep 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/09/17/rag-is-more-than-just-embedding-search/Generating Structured Output / JSON from LLMsjxnlIntroduction<h1>Generating Structured Output / JSON from LLMs</h1><p>Language models have seen significant growth. Using them effectively often requires complex frameworks. This post discusses how Instructor simplifies this process using Pydantic.</p>https://jxnl.github.io/instructor/blog/2023/09/11/generating-structured-output--json-from-llms/ Mon, 11 Sep 2023 00:00:00 +0000https://jxnl.github.io/instructor/blog/2023/09/11/generating-structured-output--json-from-llms/
\ No newline at end of file
diff --git a/feed_rss_updated.xml b/feed_rss_updated.xml
deleted file mode 100644
index fa69592a6..000000000
--- a/feed_rss_updated.xml
+++ /dev/null
@@ -1 +0,0 @@
-InstructorA lightweight library for structured outputs with LLMs.https://jxnl.github.io/instructor/Jason Liuhttps://github.com/jxnl/instructor/enTue, 12 Mar 2024 02:47:04 -0000Tue, 12 Mar 2024 02:47:04 -00001440MkDocs RSS plugin - v1.12.1AI Engineer Keynote: Pydantic is all you needjxnlprompt engineeringpythontalksvideo<h1>AI Engineer Keynote: Pydantic is all you need</h1><p><a href="https://www.youtube.com/watch?v=yj-wSRJwrrc"><img alt="Pydantic is all you need" src="https://img.youtube.com/vi/yj-wSRJwrrc/0.jpg"></a></p><p><a href="https://www.youtube.com/watch?v=yj-wSRJwrrc">Click here to watch the full talk</a></p>https://jxnl.github.io/instructor/blog/2023/11/02/ai-engineer-keynote-pydantic-is-all-you-need/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/11/02/ai-engineer-keynote-pydantic-is-all-you-need/Why Instructor is the Best Library for Structured LLM Outputsjxnlllmspython<h1>Why Instructor is the Best Library for Structured LLM Outputs</h1><p>Large language models (LLMs) like GPTs are incredibly powerful, but working with their open-ended text outputs can be challenging. This is where the Instructor library shines - it allows you to easily map LLM outputs to structured data using Python type annotations.</p>https://jxnl.github.io/instructor/blog/2024/03/05/zero-cost-abstractions/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2024/03/05/zero-cost-abstractions/Introduction to Caching in Pythonjxnlcachingdiskcachefunctoolspythonredis<h1>Introduction to Caching in Python</h1><blockquote><p>Instructor makes working with language models easy, but they are still computationally expensive.</p></blockquote><p>Today, we're diving into optimizing instructor code while maintaining the excellent DX offered by <a href="https://docs.pydantic.dev/latest/">Pydantic</a> models. We'll tackle the challenges of caching Pydantic models, typically incompatible with <code>pickle</code>, and explore solutions that use <code>decorators</code> like <code>functools.cache</code>. Then, we'll craft custom decorators with <code>diskcache</code> and <code>redis</code> to support persistent caching and distributed systems.</p>https://jxnl.github.io/instructor/blog/2023/11/26/python-caching/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/11/26/python-caching/Smarter Summaries w/ Finetuning GPT-3.5 and Chain of Densityivanleomkjxnlchain of densitydistillationfinetuneinggpt-3.5-turbopydanticvalidation<h1>Smarter Summaries w/ Finetuning GPT-3.5 and Chain of Density</h1><blockquote><p>Discover how to distil an iterative method like Chain Of Density into a single finetuned model using Instructor</p></blockquote><p>In this article, we'll guide you through implementing the original Chain of Density method using Instructor, then show how to distile a GPT 3.5 model to match GPT-4's iterative summarization capabilities. Using these methods were able to decrease latency by 20x, reduce costs by 50x and maintain entity density.</p><p>By the end you'll end up with a GPT 3.5 model, (fine-tuned using Instructor's great tooling), capable of producing summaries that rival the effectiveness of Chain of Density <a href="https://arxiv.org/abs/2309.04269">[Adams et al. (2023)]</a>. 
As always, all code is readily available in our <code>examples/chain-of-density</code> folder in our repo for your reference.</p>https://jxnl.github.io/instructor/blog/2023/11/05/chain-of-density/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/11/05/chain-of-density/Verifying LLM Citations with Pydanticjxnlcitationsfinetuneinghallucinationpydanticvalidation<h1>Verifying LLM Citations with Pydantic</h1><p>Ensuring the accuracy of information is crucial. This blog post explores how Pydantic's powerful and flexible validators can enhance data accuracy through citation verification.</p><p>We'll start with using a simple substring check to verify citations. Then we'll use <code>instructor</code> itself to power an LLM to verify citations and align answers with the given citations. Finally, we'll explore how we can use these techniques to generate a dataset of accurate responses.</p>https://jxnl.github.io/instructor/blog/2023/11/18/validate-citations/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/11/18/validate-citations/Free course on Weights and Biasesjxnlopen source<h1>Free course on Weights and Biases</h1><p>I just released a free course on wits and biases. It goes over the material from [tutorial](../../tutorials/1-introducti...</p>https://jxnl.github.io/instructor/blog/2024/02/14/weights-and-biases-course/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2024/02/14/weights-and-biases-course/Enhancing Python Functions with Instructor: A Guide to Fine-Tuning and Distillationjxnldistillationfinetuningfunction callingpython<h1>Enhancing Python Functions with Instructor: A Guide to Fine-Tuning and Distillation</h1><h2>Introduction</h2><p>Get ready to dive deep into the world of fine-tuning task specific language models with Python functions. We'll explore how the <code>instructor.instructions</code> streamlines this process, making the task you want to distil more efficient and powerful while preserving its original functionality and backwards compatibility.</p><p>If you want to see the full example checkout <a href="https://github.com/jxnl/instructor/tree/main/examples/distilations">examples/distillation</a></p>https://jxnl.github.io/instructor/blog/2023/10/17/enhancing-python-functions-with-instructor-a-guide-to-fine-tuning-and-distillation/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/10/17/enhancing-python-functions-with-instructor-a-guide-to-fine-tuning-and-distillation/Simple Synthetic Data Generationjxnl<h1>Simple Synthetic Data Generation</h1><p>What that people have been using instructor for is to generate synthetic data rather than extracting data itself. We can ...</p>https://jxnl.github.io/instructor/blog/2024/03/08/simple-synthetic-data-generation/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2024/03/08/simple-synthetic-data-generation/Generators and LLM Streamingjxnlanmolgeneratorspythonstreaming<h1>Generators and LLM Streaming</h1><p>Latency is crucial, especially in eCommerce and newer chat applications like ChatGPT. Streaming is the solution that enables us to enhance the user experience without the need for faster response times.</p><p>And what makes streaming possible? 
Generators!</p>https://jxnl.github.io/instructor/blog/2023/11/26/python-generators-and-llm-streaming/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/11/26/python-generators-and-llm-streaming/Generating Structured Output / JSON from LLMsjxnlIntroduction<h1>Generating Structured Output / JSON from LLMs</h1><p>Language models have seen significant growth. Using them effectively often requires complex frameworks. This post discusses how Instructor simplifies this process using Pydantic.</p>https://jxnl.github.io/instructor/blog/2023/09/11/generating-structured-output--json-from-llms/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/09/11/generating-structured-output--json-from-llms/Seamless Support with Langsmithjxnllangsmith<h1>Seamless Support with Langsmith</h1><p>Its a common misconception that LangChain's <a href="https://www.langchain.com/langsmith">LangSmith</a> is only compatible with LangChain's models. In reality, LangSmith is a unified DevOps platform for developing, collaborating, testing, deploying, and monitoring LLM applications. In this blog we will explore how LangSmith can be used to enhance the OpenAI client alongside <code>instructor</code>.</p>https://jxnl.github.io/instructor/blog/2024/02/18/seamless-support-with-langsmith/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2024/02/18/seamless-support-with-langsmith/Batch Processing OpenAI using asyncio and Instructor with Pythonjxnlasyncasync/awaitasynciobatchpython<h1>Batch Processing OpenAI using <code>asyncio</code> and <code>Instructor</code> with Python</h1><p>Today, I will introduce you to various approaches for using asyncio in Python. We will apply this to batch process data using <code>instructor</code> and learn how to use <code>asyncio.gather</code> and <code>asyncio.as_completed</code> for concurrent data processing. Additionally, we will explore how to limit the number of concurrent requests to a server using <code>asyncio.Semaphore</code>.</p>https://jxnl.github.io/instructor/blog/2023/11/13/learn-async/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/11/13/learn-async/Structured Output for Open Source and Local LLMSjxnlanyscalegroqllama-cpp-pythonllmsmistralollamaopensourcetogether<h1>Structured Output for Open Source and Local LLMS</h1><p>Originally, Instructor facilitated API interactions solely via the OpenAI SDK, with an emphasis on function call by incorporating <a href="https://pydantic-docs.helpmanual.io/">Pydantic</a> for structured data validation and serialization. </p><p>As the year progressed, we expanded our toolkit by integrating <a href="../../concepts/patching.md#json-mode">JSON mode</a>, thus enhancing our adaptability to vision models and open source models. This advancement now enables us to support an extensive range of models, from <a href="https://openai.com/api/">GPT</a> and <a href="https://mistral.ai">Mistral</a> to virtually any model accessible through <a href="https://ollama.ai">Ollama</a> and <a href="https://huggingface.co/models">Hugging Face</a>, facilitated by <a href="../../hub/llama-cpp-python.md">llama-cpp-python</a>. 
For more insights into leveraging JSON mode with various models, refer back to our detailed guide on <a href="../../concepts/patching.md">Patching</a>.</p><p>If you want to check out a course on how to use Instructor with Pydantic, check out our course on <a href="https://www.wandb.courses/courses/steering-language-models">Steering language models towards structured outputs.</a>.</p>https://jxnl.github.io/instructor/blog/2024/03/07/open-source-local-structured-output-pydantic-json-openai/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2024/03/07/open-source-local-structured-output-pydantic-json-openai/RAG is more than just embedding searchjxnlEmbeddingsPersonal AssistantQuery UnderstandingRAGSearch Systems<h1>RAG is more than just embedding search</h1><p>With the advent of large language models (LLM), retrieval augmented generation (RAG) has become a hot topic. However throughout the past year of <a href="https://jxnl.co">helping startups</a> integrate LLMs into their stack I've noticed that the pattern of taking user queries, embedding them, and directly searching a vector store is effectively demoware.</p><p>!!! note "What is RAG?"</p><pre><code>Retrieval augmented generation (RAG) is a technique that uses an LLM to generate responses, but uses a search backend to augment the generation. In the past year using text embeddings with a vector databases has been the most popular approach I've seen being socialized.</code></pre><figure markdown> ![RAG](img/dumb_rag.png) <figcaption>Simple RAG that embedded the user query and makes a search.</figcaption></figure><p>So let's kick things off by examining what I like to call the 'Dumb' RAG Model—a basic setup that's more common than you'd think.</p>https://jxnl.github.io/instructor/blog/2023/09/17/rag-is-more-than-just-embedding-search/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/09/17/rag-is-more-than-just-embedding-search/Good LLM Validation is Just Good Validationjxnlivanleomkchain of thoughtcitationsconstitutional aiguardrailspydanticvalidation<h1>Good LLM Validation is Just Good Validation</h1><blockquote><p>What if your validation logic could learn and adapt like a human, but operate at the speed of software? This is the future of validation and it's already here.</p></blockquote><p>Validation is the backbone of reliable software. But traditional methods are static, rule-based, and can't adapt to new challenges. This post looks at how to bring dynamic, machine learning-driven validation into your software stack using Python libraries like <code>Pydantic</code> and <code>Instructor</code>. We validate these outputs using a validation function which conforms to the structure seen below.</p><p><code>pythondef validation_function(value): if condition(value): raise ValueError("Value is not valid") return mutation(value)</code></p>https://jxnl.github.io/instructor/blog/2023/10/23/good-llm-validation-is-just-good-validation/ Tue, 12 Mar 2024 02:46:20 +0000https://jxnl.github.io/instructor/blog/2023/10/23/good-llm-validation-is-just-good-validation/
\ No newline at end of file
diff --git a/sitemap.xml.gz b/sitemap.xml.gz
index 02cf8a92a..a6e865ae8 100644
Binary files a/sitemap.xml.gz and b/sitemap.xml.gz differ