<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	
	xmlns:georss="http://www.georss.org/georss"
	xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#"
	>

<channel>
	<title>AI - Inero Software - Software Consulting</title>
	<atom:link href="https://inero-software.com/category/ai/feed/" rel="self" type="application/rss+xml" />
	<link>https://inero-software.com/category/ai/</link>
	<description>We unleash innovations using cutting-edge technologies, modern design and AI</description>
	<lastBuildDate>Mon, 17 Nov 2025 12:21:20 +0000</lastBuildDate>
	<language>en-GB</language>
	<sy:updatePeriod>
	hourly	</sy:updatePeriod>
	<sy:updateFrequency>
	1	</sy:updateFrequency>
	<generator>https://wordpress.org/?v=6.9.1</generator>

<image>
	<url>https://inero-software.com/wp-content/uploads/2018/11/inero-logo-favicon.png</url>
	<title>AI - Inero Software - Software Consulting</title>
	<link>https://inero-software.com/category/ai/</link>
	<width>32</width>
	<height>32</height>
</image> 
<site xmlns="com-wordpress:feed-additions:1">153509928</site>	<item>
		<title>Implementing an AI-Powered Telephony Service Center with ElevenLabs &#038; LiveAPI</title>
		<link>https://inero-software.com/enterprise-ai-telephony/</link>
		
		<dc:creator><![CDATA[Andrzej Chybicki]]></dc:creator>
		<pubDate>Mon, 17 Nov 2025 11:18:27 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Blog]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[Technology]]></category>
		<category><![CDATA[AI call center]]></category>
		<category><![CDATA[AI telephony]]></category>
		<category><![CDATA[AI voice pipelines]]></category>
		<category><![CDATA[conversational AI]]></category>
		<category><![CDATA[enterprise AI]]></category>
		<category><![CDATA[GDPR compliance]]></category>
		<category><![CDATA[LiveAPI]]></category>
		<category><![CDATA[LLM voice interfaces]]></category>
		<category><![CDATA[real-time voice systems]]></category>
		<category><![CDATA[streaming AI;]]></category>
		<category><![CDATA[telephony integration]]></category>
		<category><![CDATA[voice automation]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=8238</guid>

					<description><![CDATA[<p>Implementing an AI-Powered Telephony Service Center with ElevenLabs &#38; LiveAPI Over the past year, advancements in real-time AI models and high‑fidelity speech synthesis have accelerated the development of AI-driven telephony systems. At Inero, we’ve had the opportunity to integrate modern telephony solutions with LiveAPI technology and ElevenLabs’ voice engine to&#8230;</p>
<p>Artykuł <a href="https://inero-software.com/enterprise-ai-telephony/">Implementing an AI-Powered Telephony Service Center with ElevenLabs &#038; LiveAPI</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="8238" class="elementor elementor-8238" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-44c8f7e e-flex e-con-boxed e-con e-parent" data-id="44c8f7e" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-cfa815a elementor-widget elementor-widget-spacer" data-id="cfa815a" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-6cc775b e-flex e-con-boxed e-con e-parent" data-id="6cc775b" data-element_type="container">
					<div class="e-con-inner">
		<div class="elementor-element elementor-element-ad26502 e-con-full e-flex e-con e-child" data-id="ad26502" data-element_type="container">
				</div>
		<div class="elementor-element elementor-element-4974bf1 e-con-full e-flex e-con e-child" data-id="4974bf1" data-element_type="container">
				<div class="elementor-element elementor-element-dc50676 elementor-widget elementor-widget-text-editor" data-id="dc50676" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h1><span lang="EN-US">Implementing an AI-Powered Telephony Service Center with ElevenLabs &amp; LiveAPI</span></h1><p> </p><p class="MsoNormal"><span lang="EN-US">Over the past year, advancements in real-time AI models and high‑fidelity speech synthesis have accelerated the development of AI-driven telephony systems. At Inero, we’ve had the opportunity to integrate modern telephony solutions with LiveAPI technology and ElevenLabs’ voice engine to create a human‑like, responsive, GDPR‑compliant communication experience for a major corporate client.<br /><br />This article combines two perspectives: a high-level overview of LiveAPI and ElevenLabs technology, and a behind‑the‑scenes look at our practical engineering experience while delivering a real-world AI telephony solution.</span></p>						</div>
				</div>
				</div>
		<div class="elementor-element elementor-element-5ab22b7 e-con-full e-flex e-con e-child" data-id="5ab22b7" data-element_type="container">
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-0150de1 e-flex e-con-boxed e-con e-parent" data-id="0150de1" data-element_type="container">
					<div class="e-con-inner">
		<div class="elementor-element elementor-element-e45f203 e-con-full e-flex e-con e-child" data-id="e45f203" data-element_type="container">
				</div>
		<div class="elementor-element elementor-element-a617588 e-con-full e-flex e-con e-child" data-id="a617588" data-element_type="container">
				<div class="elementor-element elementor-element-83d612c elementor-widget elementor-widget-spacer" data-id="83d612c" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-e0cafc0 elementor-widget elementor-widget-text-editor" data-id="e0cafc0" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h2><span lang="EN-US">1. What Makes LiveAPI and ElevenLabs a Powerful Combination?</span></h2><p> </p><p class="MsoNormal"><span lang="EN-US">LiveAPI solutions such as OpenAI Realtime API and Google Gemini Live API shift the paradigm from static prompts to streaming, interactive communication. These systems support real‑time audio input, low‑latency responses, natural interrupt handling, and multimodal context.<br /><br />ElevenLabs complements this with industry‑leading voice synthesis. Its realistic, expressive voices and advanced prosody control enable AI agents that sound convincingly human. For telephony environments, this matters — clients expect clarity, confidence, and a pleasant conversational tone.</span></p>						</div>
				</div>
		<div class="elementor-element elementor-element-275490b e-con-full e-flex e-con e-child" data-id="275490b" data-element_type="container">
				<div class="elementor-element elementor-element-b98492a elementor-widget elementor-widget-image" data-id="b98492a" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img fetchpriority="high" decoding="async" data-attachment-id="8251" data-permalink="https://inero-software.com/enterprise-ai-telephony/liveapi_elevenlabs_interactionmodel/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel.png" data-orig-size="1536,1024" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LiveAPI + ElevenLabs Interaction Model" data-image-description="&lt;p&gt;A clean, purple-themed diagram visualizing the data flow in an AI-powered telephony system. The graphic illustrates how a user speaks into a microphone, how the audio is processed by a LiveAPI voice LLM, and how the response is synthesized by ElevenLabs TTS before returning to the user as speech. The design represents a real-time, low-latency interaction loop used in modern conversational AI and telephony integrations.&lt;/p&gt;
" data-image-caption="&lt;p&gt;How user audio flows through LiveAPI and ElevenLabs TTS to create real-time voice responses.&lt;/p&gt;
" data-medium-file="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-300x200.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-1030x687.png" tabindex="0" role="button" width="1030" height="687" src="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-1030x687.png" class="attachment-large size-large wp-image-8251" alt="Diagram showing the interaction flow between a user, a LiveAPI voice model, and ElevenLabs TTS in a real-time AI telephony system." srcset="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-1030x687.png 1030w, https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-300x200.png 300w, https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-768x512.png 768w, https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-450x300.png 450w, https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel.png 1536w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="8251" data-permalink="https://inero-software.com/enterprise-ai-telephony/liveapi_elevenlabs_interactionmodel/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel.png" data-orig-size="1536,1024" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LiveAPI + ElevenLabs Interaction Model" data-image-description="&lt;p&gt;A clean, purple-themed diagram visualizing the data flow in an AI-powered telephony system. The graphic illustrates how a user speaks into a microphone, how the audio is processed by a LiveAPI voice LLM, and how the response is synthesized by ElevenLabs TTS before returning to the user as speech. The design represents a real-time, low-latency interaction loop used in modern conversational AI and telephony integrations.&lt;/p&gt;
" data-image-caption="&lt;p&gt;How user audio flows through LiveAPI and ElevenLabs TTS to create real-time voice responses.&lt;/p&gt;
" data-medium-file="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-300x200.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/11/LiveAPI_ElevenLabs_InteractionModel-1030x687.png" role="button" />													</div>
				</div>
				</div>
				</div>
		<div class="elementor-element elementor-element-ca7edd1 e-con-full e-flex e-con e-child" data-id="ca7edd1" data-element_type="container">
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-3553e31 e-flex e-con-boxed e-con e-parent" data-id="3553e31" data-element_type="container">
					<div class="e-con-inner">
		<div class="elementor-element elementor-element-4d3148a e-con-full e-flex e-con e-child" data-id="4d3148a" data-element_type="container">
				</div>
		<div class="elementor-element elementor-element-5d07d44 e-con-full e-flex e-con e-child" data-id="5d07d44" data-element_type="container">
				<div class="elementor-element elementor-element-1a97268 elementor-widget elementor-widget-spacer" data-id="1a97268" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-02ef01f elementor-widget elementor-widget-text-editor" data-id="02ef01f" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h2><span lang="EN-US">2. Why GDPR Compliance Shapes the Choice of API in Europe</span></h2><p class="MsoNormal"><span lang="EN-US">For European organisations, GDPR compliance is not optional — it defines which AI vendors can be used in production. Although both OpenAI and Google offer real-time APIs, enterprises operating in the EU often restrict use to providers ensuring transparent, EU‑aligned data governance. In practice, this means that Gemini Live API was the viable choice for our implementation, while OpenAI was excluded despite strong technical capabilities.</span></p>						</div>
				</div>
				</div>
		<div class="elementor-element elementor-element-b6d89f4 e-con-full e-flex e-con e-child" data-id="b6d89f4" data-element_type="container">
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-edad7b5 e-flex e-con-boxed e-con e-parent" data-id="edad7b5" data-element_type="container">
					<div class="e-con-inner">
		<div class="elementor-element elementor-element-8da2a35 e-con-full e-flex e-con e-child" data-id="8da2a35" data-element_type="container">
				</div>
		<div class="elementor-element elementor-element-6d9a181 e-con-full e-flex e-con e-child" data-id="6d9a181" data-element_type="container">
				<div class="elementor-element elementor-element-567ff66 elementor-widget elementor-widget-spacer" data-id="567ff66" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-f5c5517 elementor-widget elementor-widget-text-editor" data-id="f5c5517" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h2><span lang="EN-US">3. Our Practical Experience Integrating Telephony with LiveAPI and ElevenLabs</span></h2><p class="MsoNormal"><span lang="EN-US">Below we outline the key lessons, challenges, and engineering decisions from our implementation.</span></p><p class="MsoNormal"><span lang="EN-US"> </span></p><h3><span lang="EN-US">3.1 Project Context</span></h3><p class="MsoNormal"><span lang="EN-US">Our client — a large corporate organisation — required a system capable of handling outbound and inbound calls automatically, while maintaining a tone and responsiveness extremely close to human interaction. The goal was not a simple IVR or menu system, but a natural, fully conversational experience driven by real‑time AI.</span></p><p class="MsoNormal"><span lang="EN-US"> </span></p><h3><span lang="EN-US">3.2 Technology Stack and Constraints</span></h3><p class="MsoNormal"><span lang="EN-US">We evaluated both OpenAI and Gemini Live APIs to compare latency, contextual reasoning and streaming quality. However, due to GDPR compliance requirements, the production system was designed around Gemini Live API. ElevenLabs provided the speech synthesis layer, offering high realism and consistent quality across telephony channels.</span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-a79ca65 elementor-widget elementor-widget-image" data-id="a79ca65" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img decoding="async" data-attachment-id="8260" data-permalink="https://inero-software.com/enterprise-ai-telephony/telephony_elevenlabs_pipeline-2/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1.png" data-orig-size="1536,1024" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="AI Telephony Pipleine" data-image-description="&lt;p&gt;Diagram showing the processing pipeline from telephony audio through LiveAPI to ElevenLabs TTS in an AI-powered voice system.&lt;/p&gt;
" data-image-caption="&lt;p&gt;Diagram showing the processing pipeline from telephony audio through LiveAPI to ElevenLabs TTS in an AI-powered voice system.&lt;/p&gt;
" data-medium-file="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-300x200.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-1030x687.png" tabindex="0" role="button" width="768" height="512" src="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-768x512.png" class="attachment-medium_large size-medium_large wp-image-8260" alt="Telephony with AI Processing Pipeline" srcset="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-768x512.png 768w, https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-300x200.png 300w, https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-1030x687.png 1030w, https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1.png 1536w" sizes="(max-width: 768px) 100vw, 768px" data-attachment-id="8260" data-permalink="https://inero-software.com/enterprise-ai-telephony/telephony_elevenlabs_pipeline-2/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1.png" data-orig-size="1536,1024" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="AI Telephony Pipleine" data-image-description="&lt;p&gt;Diagram showing the processing pipeline from telephony audio through LiveAPI to ElevenLabs TTS in an AI-powered voice system.&lt;/p&gt;
" data-image-caption="&lt;p&gt;Diagram showing the processing pipeline from telephony audio through LiveAPI to ElevenLabs TTS in an AI-powered voice system.&lt;/p&gt;
" data-medium-file="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-300x200.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/11/Telephony_ElevenLabs_Pipeline-1-1030x687.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-1ed3b4d elementor-widget elementor-widget-text-editor" data-id="1ed3b4d" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h3 style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal;"><span lang="EN-US">3.3 Key Engineering Challenges</span></h3><p class="MsoNormal" style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;"><span lang="EN-US">Beyond typical engineering concerns like audio quality, session stability, and call routing, the most demanding challenge was not purely technical — it was understanding how real users communicate over the phone. Subtle behaviors such as interruptions, hesitation, changing tone, or switching context required careful analysis and extensive testing.</span></p><p style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;">We also dealt with several micro‑issues, such as premature call termination, incorrect end‑of‑utterance detection, and managing the timing between user speech and AI responses.</p><p style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;"> </p><h3 style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal;"><span lang="EN-US">3.4 What We Built Ourselves</span></h3><p class="MsoNormal" style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;"><span lang="EN-US">AI models are inherently non‑deterministic and cannot be fully controlled like classic software components. To ensure predictable and business‑aligned outcomes, we developed backend modules responsible for:<br />• Conversation flow supervision<br />• Session state tracking<br />• Monitoring and logging voice interactions<br />• Handling edge cases and ambiguous user inputs</span></p><p style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;">ElevenLabs’ tooling, especially the Hard Disk service, significantly supported our workflow, but the orchestration layer was built entirely by Inero.</p><p style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;"> </p><h3 style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal;"><span lang="EN-US">3.5 What We Learned</span></h3><p class="MsoNormal" style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;"><span lang="EN-US">The most important insight: designing a telephony AI system requires deep understanding of the user’s context, combined with the business objectives of the project. Quick prototyping and iterative PoC testing were essential — allowing us to validate conversational patterns early, reveal unexpected user behavior, and refine the interaction design.</span></p><p style="font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 300; font-size: 14px; font-family: Roboto, sans-serif;">Ultimately, success depended on aligning the AI’s conversational style with how real customers naturally speak, pause, and respond during a phone call.</p>						</div>
				</div>
				</div>
		<div class="elementor-element elementor-element-4d8ebb5 e-con-full e-flex e-con e-child" data-id="4d8ebb5" data-element_type="container">
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-36fce65 e-flex e-con-boxed e-con e-parent" data-id="36fce65" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-bafc838 elementor-widget elementor-widget-spacer" data-id="bafc838" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-f0ecd4f e-flex e-con-boxed e-con e-parent" data-id="f0ecd4f" data-element_type="container">
					<div class="e-con-inner">
		<div class="elementor-element elementor-element-a477dbd e-con-full e-flex e-con e-child" data-id="a477dbd" data-element_type="container">
				</div>
		<div class="elementor-element elementor-element-326a90c e-con-full e-flex e-con e-child" data-id="326a90c" data-element_type="container">
				<div class="elementor-element elementor-element-1fab35c elementor-widget elementor-widget-text-editor" data-id="1fab35c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h2><span lang="EN-US">4. GDPR Considerations in AI Telephony</span></h2><p> </p><p class="MsoNormal"><span lang="EN-US">All audio handling, session storage, and logging were designed according to GDPR principles: strict data minimisation, no training on user audio, encrypted transmission, and optional anonymisation of transcriptions. Where possible, processing was routed through EU‑aligned infrastructure.</span></p>						</div>
				</div>
				</div>
		<div class="elementor-element elementor-element-fdd54ad e-con-full e-flex e-con e-child" data-id="fdd54ad" data-element_type="container">
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-59b4a48 e-flex e-con-boxed e-con e-parent" data-id="59b4a48" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-9ace4b8 elementor-widget elementor-widget-spacer" data-id="9ace4b8" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-bc2dbef e-flex e-con-boxed e-con e-parent" data-id="bc2dbef" data-element_type="container">
					<div class="e-con-inner">
		<div class="elementor-element elementor-element-ec7d459 e-con-full e-flex e-con e-child" data-id="ec7d459" data-element_type="container">
				</div>
		<div class="elementor-element elementor-element-46c6762 e-con-full e-flex e-con e-child" data-id="46c6762" data-element_type="container">
				<div class="elementor-element elementor-element-792a12f elementor-widget elementor-widget-text-editor" data-id="792a12f" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h2><span lang="EN-US">Conclusion<o:p></o:p></span></h2><p>

</p><p class="MsoNormal"><span lang="EN-US">Implementing an AI‑driven telephony service
center requires more than connecting APIs — it requires understanding users,
managing nuanced conversational flows, and ensuring full compliance with EU
regulations. Our experience shows that LiveAPI technologies combined with
ElevenLabs can deliver highly human‑like, responsive, and scalable
communication channels for enterprise clients.<o:p></o:p></span></p>						</div>
				</div>
				</div>
		<div class="elementor-element elementor-element-421f13d e-con-full e-flex e-con e-child" data-id="421f13d" data-element_type="container">
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/enterprise-ai-telephony/">Implementing an AI-Powered Telephony Service Center with ElevenLabs &#038; LiveAPI</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">8238</post-id>	</item>
		<item>
		<title>Chatbot, Agent or AI Assistant? Find Out Which Solution Is Best for Your Business</title>
		<link>https://inero-software.com/chatbot-agent-or-ai-assistant-find-out-which-solution-is-best-for-your-business/</link>
		
		<dc:creator><![CDATA[Marta Kuprasz]]></dc:creator>
		<pubDate>Thu, 08 May 2025 08:57:21 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Blog]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[AI development]]></category>
		<category><![CDATA[AI innovations]]></category>
		<category><![CDATA[Artificial Intelligence]]></category>
		<category><![CDATA[BusinessProcessesOptimization]]></category>
		<category><![CDATA[ChatGPT]]></category>
		<category><![CDATA[Gemini]]></category>
		<category><![CDATA[Large Language Model]]></category>
		<category><![CDATA[LLM]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=7947</guid>

					<description><![CDATA[<p>Artificial intelligence and Large Language Models are buzzwords heard in nearly every industry. Many companies are wondering how to use them safely and which solution will be the most effective. There are plenty of options—and they’re often hard to tell apart. In this article, we break them down in a clear and easy-to-understand way.</p>
<p>Artykuł <a href="https://inero-software.com/chatbot-agent-or-ai-assistant-find-out-which-solution-is-best-for-your-business/">Chatbot, Agent or AI Assistant? Find Out Which Solution Is Best for Your Business</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="7947" class="elementor elementor-7947" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-c1eecc3 e-flex e-con-boxed e-con e-parent" data-id="c1eecc3" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-a23440b elementor-widget elementor-widget-html" data-id="a23440b" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			 		</div>
				</div>
				<div class="elementor-element elementor-element-5054636 elementor-widget elementor-widget-text-editor" data-id="5054636" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h4>Artificial intelligence and Large Language Models are buzzwords heard in nearly every industry. Many companies are wondering how to use them safely and which solution will be the most effective. There are plenty of options—and they’re often hard to tell apart. In this article, we break them down in a clear and easy-to-understand way.</h4>						</div>
				</div>
				<div class="elementor-element elementor-element-ef953eb elementor-widget elementor-widget-text-editor" data-id="ef953eb" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>AI can take on many roles in a company—as a chatbot, assistant, agent, data analysis tool, content generator, or knowledge search engine. So how can you choose the solution that best fits your employees’ needs? It helps to understand what each option has to offer.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-3d8a982 elementor-widget elementor-widget-heading" data-id="3d8a982" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Chatbot – answers questions, provides explanations, and handles requests
</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-9aafe69 elementor-widget elementor-widget-text-editor" data-id="9aafe69" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>This is the most common use of AI in areas such as customer service and sales. An AI chatbot based on a large language model, such as ChatGPT, can hold natural conversations, understand the context of inquiries, and deliver accurate answers—24/7, in multiple languages, and without human involvement.</p><p> </p><p>These solutions are typically implemented on websites, in messaging platforms (like Messenger or WhatsApp), or within helpdesk systems, where they assist with answering questions, tracking orders, or providing product information. As a result, they significantly automate customer service, reduce operational costs, and improve customer satisfaction ratings.</p><p> </p><p>For the purposes of this article, we define a chatbot as an AI interface primarily intended for external users—in other words, it operates “outside the company.” This definition distinguishes it from AI agents, which perform more complex tasks within internal processes by integrating with systems, databases, or APIs.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-67e3688 elementor-widget elementor-widget-image" data-id="67e3688" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img decoding="async" width="1030" height="408" src="https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-1030x408.png" class="attachment-large size-large wp-image-7936" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-1030x408.png 1030w, https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-300x119.png 300w, https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-768x304.png 768w, https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-1536x609.png 1536w, https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-757x300.png 757w, https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226.png 1832w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7936" data-permalink="https://inero-software.com/pl/chatbot-agent-czy-asystent-ai-sprawdz-ktore-rozwiazanie-najlepiej-sprawdzi-sie-w-twoim-biznesie/zrzut-ekranu-2025-05-06-122226/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226.png" data-orig-size="1832,726" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Zrzut ekranu 2025-05-06 122226" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-300x119.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/05/Zrzut-ekranu-2025-05-06-122226-1030x408.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-fb8d9b1 elementor-widget elementor-widget-text-editor" data-id="fb8d9b1" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><a href="https://www.incone60.eu/seastat">https://www.incone60.eu/seastat</a></p><p> </p>						</div>
				</div>
				<div class="elementor-element elementor-element-5fb00e5 elementor-widget elementor-widget-spacer" data-id="5fb00e5" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-70e37da elementor-widget elementor-widget-heading" data-id="70e37da" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">AI Agent – a tool designed to carry out specific tasks</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-ae7ea10 elementor-widget elementor-widget-text-editor" data-id="ae7ea10" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p class="" data-start="0" data-end="327">Unlike a chatbot, which interacts with external users, an AI agent operates within the organization and supports employees by automating specific business processes. It’s not a one-size-fits-all tool—it’s built with a clearly defined purpose in mind, such as document processing, data analysis, or integration with ERP systems.</p><p data-start="0" data-end="327"> </p><p class="" data-start="329" data-end="590">Thanks to large language models like Gemini or Claude, an AI agent can understand context, make decisions, and trigger specific actions—without human input. It can run in the background, process data from multiple sources, manage files, or handle email inboxes. Each AI agent is tailored to the company’s individual needs and specific tasks. Only then can it offer real value instead of becoming just another generic tool.</p><p class="" data-start="754" data-end="930">Want to see how this works in practice?</p><p class="" data-start="754" data-end="930"><br data-start="793" data-end="796" />Check out our case study:<a href="https://inero-software.com/meet-your-personal-ai-agent-a-case-study-for-a-freight-forwarding-company/"> Meet your personal AI agent-a case study for a freight forwarding company</a> – where we describe how we built an agent integrated with an email inbox.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-272f47a elementor-widget__width-initial elementor-widget elementor-widget-video" data-id="272f47a" data-element_type="widget" data-settings="{&quot;youtube_url&quot;:&quot;https:\/\/youtu.be\/B4VxxjWYzDM&quot;,&quot;video_type&quot;:&quot;youtube&quot;,&quot;controls&quot;:&quot;yes&quot;}" data-widget_type="video.default">
				<div class="elementor-widget-container">
					<div class="elementor-wrapper elementor-open-inline">
			<div class="elementor-video"></div>		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-a535da1 elementor-widget elementor-widget-spacer" data-id="a535da1" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-a575c44 elementor-widget elementor-widget-heading" data-id="a575c44" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">AI Assistant – supports users in daily work by operating contextually and “in the background”</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-ddbd088 elementor-widget elementor-widget-text-editor" data-id="ddbd088" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Unlike a chatbot that answers questions or an agent that automates a specific process, an AI assistant is a tool that works alongside employees in real time—it understands context, suggests next steps, and makes tasks easier within familiar applications.</p><p> </p><p>It’s typically integrated into a specific work environment, such as a word processor, spreadsheet, CRM, or project management tool. The assistant doesn’t replace the user—it actively supports them in making decisions, writing, analyzing data, or planning.</p><p> </p><p>AI assistants like GitHub Copilot, Notion AI, or Google’s Workspace assistant show how this technology can genuinely boost team productivity and reduce time spent on routine tasks. From a business perspective, a well-designed assistant can improve work quality, reduce errors, and make onboarding new employees easier.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-ebf3d14 elementor-widget elementor-widget-spacer" data-id="ebf3d14" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-823b953 elementor-widget elementor-widget-heading" data-id="823b953" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Other Business Applications of Large Language Models</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-767d863 elementor-widget elementor-widget-text-editor" data-id="767d863" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>The possibilities go far beyond chatbots, assistants, or agents. These models can take on specialized roles, supporting tasks such as document processing, data analysis, or content creation. They’re increasingly used to automatically summarize reports, extract information from unstructured sources (like emails, PDFs, or scanned forms), or answer natural-language questions based on internal documentation.</p><p> </p><p>LLMs can also assist marketing teams by generating suggestions for ad copy, product descriptions, or sales messages tailored to the company’s style. In analytics departments, they provide faster access to data—generating database queries, interpreting results, and presenting insights in a way that’s easy for non-technical users to understand. These applications often don’t require building a new tool from scratch, but rather integrating the AI model into existing company systems. This way, the technology supports specific tasks—right where it’s needed.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-0a9debf elementor-widget elementor-widget-spacer" data-id="0a9debf" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-3481b69 elementor-widget elementor-widget-heading" data-id="3481b69" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">AI Models and Data Security
</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-5be148c elementor-widget elementor-widget-text-editor" data-id="5be148c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Business owners and managers still approach AI tools with caution, mainly because they’re unsure how to ensure the security and confidentiality of processed data. We’ve explored these topics in previous publications that are worth reviewing.</p><p> </p><p>In the article <em>“</em><a href="https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/" rel="bookmark"><strong>AI User Privacy: An Analysis of Platform Policies</strong></a><em>”</em>, we outlined the data privacy and model training policies followed by major AI providers such as OpenAI, Google Gemini, Microsoft’s Azure OpenAI, and Anthropic’s Claude.</p><p> </p><p>For those considering an on-premise solution, we recommend the blog post <em>“</em><strong><a href="https://inero-software.com/top-lightweight-llms-for-local-deployment/" rel="bookmark">Top Lightweight LLMs for Local Deployment</a></strong><em>”</em> There, we reviewed several top open-source lightweight LLMs and explained how to run them on a local Windows machine—even with limited GPU resources.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-b40d87c elementor-widget elementor-widget-text-editor" data-id="b40d87c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Choosing the right AI tool for your company depends primarily on the goal it’s meant to achieve. A chatbot works best where quick and accessible customer service is key. An AI agent can automate repetitive internal processes and improve information flow between systems. An AI assistant provides day-to-day support for employees—offering suggestions, summaries, or preparing data for further use.</p><p> </p><p>Large language models also allow integration with existing processes—without the need to build a dedicated tool from scratch. However, implementing AI-based technology requires a well-thought-out decision, taking into account both efficiency and data security. If you&#8217;re looking to adopt AI in your company and need an experienced partner to guide you through the process, get in touch with us.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-d041a5c elementor-cta--skin-cover elementor-animated-content elementor-bg-transform elementor-bg-transform-zoom-in elementor-widget elementor-widget-call-to-action" data-id="d041a5c" data-element_type="widget" data-widget_type="call-to-action.default">
				<div class="elementor-widget-container">
					<a class="elementor-cta" href="https://inero-software.com/contact-us/">
					<div class="elementor-cta__bg-wrapper">
				<div class="elementor-cta__bg elementor-bg" style="background-image: url(https://inero-software.com/wp-content/uploads/2025/03/cta-1903-1030x579.png);" role="img" aria-label="cta 1903"></div>
				<div class="elementor-cta__bg-overlay"></div>
			</div>
							<div class="elementor-cta__content">
				
									<h2 class="elementor-cta__title elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						Bring AI into Your Business					</h2>
				
									<div class="elementor-cta__description elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						We provide professional consulting and end-to-end implementation of tools based on large language models.
					</div>
				
									<div class="elementor-cta__button-wrapper elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
					<span class="elementor-cta__button elementor-button elementor-size-">
						Contact Us					</span>
					</div>
							</div>
						</a>
				</div>
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/chatbot-agent-or-ai-assistant-find-out-which-solution-is-best-for-your-business/">Chatbot, Agent or AI Assistant? Find Out Which Solution Is Best for Your Business</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">7947</post-id>	</item>
		<item>
		<title>AI User Privacy: An Analysis of Platform Policies</title>
		<link>https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/</link>
		
		<dc:creator><![CDATA[Martyna Mul]]></dc:creator>
		<pubDate>Wed, 30 Apr 2025 08:35:35 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[AI development]]></category>
		<category><![CDATA[AI innovations]]></category>
		<category><![CDATA[Artificial Intelligence]]></category>
		<category><![CDATA[ChatGPT]]></category>
		<category><![CDATA[Gemini]]></category>
		<category><![CDATA[Large Language Model]]></category>
		<category><![CDATA[LLM]]></category>
		<category><![CDATA[Privacy Policies]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=7890</guid>

					<description><![CDATA[<p>In this article, we’ll break down the data privacy policies of top AI platforms. You will also learn what to do to ensure your data is not used for training Large Language Models (LLM).</p>
<p>Artykuł <a href="https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/">AI User Privacy: An Analysis of Platform Policies</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="7890" class="elementor elementor-7890" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-bc35505 e-flex e-con-boxed e-con e-parent" data-id="bc35505" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-44ba7b6 elementor-widget elementor-widget-html" data-id="44ba7b6" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			 		</div>
				</div>
				<div class="elementor-element elementor-element-23d3d65 elementor-widget elementor-widget-text-editor" data-id="23d3d65" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h4>Ever wondered where your data goes when you interact with AI cloud platforms? Or is it used to train future models? In this article, we’ll break down the data privacy policies of top AI platforms. You will also learn what to do to ensure your data is not used for training Large Language Models (LLM).</h4>						</div>
				</div>
				<div class="elementor-element elementor-element-18af7ef elementor-widget elementor-widget-text-editor" data-id="18af7ef" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Major AI cloud providers have become increasingly transparent about their data usage policies &#8211; especially when it comes to training models. While most platforms, particularly those offering enterprise-level services, do not use your inputs and outputs for training by default, the fine print matters. Understanding how these services handle your data &#8211; and how you can maintain control &#8211; is essential.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-e8dd97a elementor-widget elementor-widget-text-editor" data-id="e8dd97a" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>In this article, we’ll break down the data privacy and model training policies of top AI platforms, including OpenAI, Google Gemini, Microsoft’s Azure OpenAI and Anthropic’s Claude. You’ll learn:</p>						</div>
				</div>
				<div class="elementor-element elementor-element-33a2f78 elementor-widget elementor-widget-text-editor" data-id="33a2f78" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li>How AI platforms use your data and whether your data is used to train models by default</li><li>How to prevent AI from using your data opt, if needed</li><li>Where your data is stored (data residency), and</li><li>What compliance measures (like GDPR) apply</li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-291cb3e elementor-widget elementor-widget-text-editor" data-id="291cb3e" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Adopting AI isn’t just about prompt engineering or model performance. It’s also about knowing where your data goes—and how to ensure it stays under your control.</p><p><strong>Here’s what you need to know:</strong></p>						</div>
				</div>
				<div class="elementor-element elementor-element-ecb1c2a elementor-widget elementor-widget-spacer" data-id="ecb1c2a" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-2add4a6 elementor-widget elementor-widget-heading" data-id="2add4a6" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">OpenAI – Data Usage and Privacy</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-cb6fb79 elementor-widget elementor-widget-text-editor" data-id="cb6fb79" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>OpenAI treats your data differently based on how you interact with its services:</p><p><strong>ChatGPT App (Web/Mobile)</strong></p><p>When you chat with ChatGPT, your conversations may be used to train AI models &#8211; unless you manually opt out. To prevent your data from being used:</p>						</div>
				</div>
				<div class="elementor-element elementor-element-01b1f1c elementor-widget elementor-widget-text-editor" data-id="01b1f1c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li>Go to Settings → Data Controls → Improve the model for everyone and toggle it off.</li><li>Even with the opt-out, OpenAI stores chats for 30 days for abuse monitoring before deletion.</li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-1fb6e1a elementor-widget elementor-widget-image" data-id="1fb6e1a" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7897" data-permalink="https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/image-2-2/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/image-2-1.png" data-orig-size="602,407" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="image (2)" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/image-2-1-300x203.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/image-2-1.png" tabindex="0" role="button" width="602" height="407" src="https://inero-software.com/wp-content/uploads/2025/04/image-2-1.png" class="attachment-large size-large wp-image-7897" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/04/image-2-1.png 602w, https://inero-software.com/wp-content/uploads/2025/04/image-2-1-300x203.png 300w, https://inero-software.com/wp-content/uploads/2025/04/image-2-1-444x300.png 444w" sizes="(max-width: 602px) 100vw, 602px" data-attachment-id="7897" data-permalink="https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/image-2-2/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/image-2-1.png" data-orig-size="602,407" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="image (2)" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/image-2-1-300x203.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/image-2-1.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-422566b elementor-widget elementor-widget-heading" data-id="422566b" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">OpenAI API and ChatGPT Enterprise</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-0be90ca elementor-widget elementor-widget-text-editor" data-id="0be90ca" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>If you&#8217;re a developer or a business using <strong>OpenAI&#8217;s API</strong> or <strong>ChatGPT Enterprise</strong>, there’s no need to opt out. By default, <strong>OpenAI does not use API or Enterprise data to train its models</strong>, and <strong>your data stays private</strong>. You don’t need to do anything to opt out &#8211; it’s already protected. You can choose to share data to help improve the model, but only if you want to.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-d497044 elementor-widget elementor-widget-heading" data-id="d497044" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h4 class="elementor-heading-title elementor-size-default">Data Residency  </h4>		</div>
				</div>
				<div class="elementor-element elementor-element-bd96e19 elementor-widget elementor-widget-text-editor" data-id="bd96e19" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="auto">OpenAI’s servers are mostly based in the </span><strong>United States</strong><span data-contrast="auto"><strong>,</strong> and currently, if you&#8217;re using the API directly, </span><strong>you can’t choose where your data is stored</strong><span data-contrast="auto"><strong>.</strong> That means your data is processed within OpenAI’s own infrastructure &#8211; protected by strong security, but </span><strong>not necessarily hosted in your country. </strong></p><p><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><p><span data-contrast="auto">However, there’s some progress for enterprise users. OpenAI recently introduced an option for </span><strong>eligible enterprise API</strong><b><span data-contrast="auto"> customers</span></b><span data-contrast="auto"> that allows data to be stored in </span><strong>Europe</strong><span data-contrast="auto">, provided there’s a specific agreement in place.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><p><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><p><strong>If regional data residency</strong><span data-contrast="auto"> is important for your business &#8211; say, for GDPR or internal compliance &#8211; you might want to consider using </span><strong>Azure OpenAI</strong><span data-contrast="auto">, which hosts OpenAI’s models on Microsoft’s cloud. With Azure, you can choose a region like </span><strong>Western Europe or Asia</strong><span data-contrast="auto"><strong>,</strong> and all data processing and storage will stay within that geography.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><p><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><p><span data-contrast="auto">We’ll dive into Azure more in the next section &#8211; but in short: </span><strong>OpenAI handles your data securely</strong><span data-contrast="auto">, but for strict control over </span><i><span data-contrast="auto">where</span></i><span data-contrast="auto"> it lives, </span><b><span data-contrast="auto">a</span></b><strong> partner cloud service like Azure may be a better fit. </strong></p>						</div>
				</div>
				<div class="elementor-element elementor-element-5c3e1ec elementor-widget elementor-widget-spacer" data-id="5c3e1ec" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-0a6231f elementor-widget elementor-widget-heading" data-id="0a6231f" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Google (Gemini) – Google’s Approach to Your Data </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-c7c8d68 elementor-widget elementor-widget-text-editor" data-id="c7c8d68" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="auto">Google’s foray into generative AI includes </span><strong>Gemini</strong><span data-contrast="auto">, a next-generation model that powers products like Google Gemini (the chatbot) and various enterprise AI offerings on Google Cloud. Here&#8217;s how they handle your data:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p><p><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p><h5><b><span data-contrast="auto">Gemini App</span></b><span data-ccp-props="{}"> </span></h5><div><span data-ccp-props="{}"> </span></div><p><strong>By default, Google does save your Gemini chat history to your account (much like search history) and may use it to improve their service. However, Google provides a “Gemini Activity” setting to control this</strong><span data-contrast="auto"><strong>.</strong> </span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p><p><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p><p><span data-contrast="auto">To manage this:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-83c9f69 elementor-widget elementor-widget-text-editor" data-id="83c9f69" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="5" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><span data-contrast="auto">Visit </span><strong>Gemini Activity</strong><span data-contrast="auto"> settings.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="5" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><span data-contrast="auto">Pause Gemini Activity to stop saving chats and prevent them from being used in </span><strong>AI model training data sources. </strong></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="5" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><span data-contrast="auto">You can also delete existing conversation history.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-13a61aa elementor-widget elementor-widget-text-editor" data-id="13a61aa" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><a href="https://support.google.com/gemini/answer/13594961#your_data"><span class="TextRun Underlined SCXW259565000 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW259565000 BCX0" data-ccp-charstyle="Hyperlink">T</span></span><span class="TextRun Underlined SCXW259565000 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW259565000 BCX0" data-ccp-charstyle="Hyperlink">urning off </span><span class="NormalTextRun SCXW259565000 BCX0" data-ccp-charstyle="Hyperlink">Gemini</span></span><span class="TextRun Underlined SCXW259565000 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW259565000 BCX0" data-ccp-charstyle="Hyperlink"> Activity</span></span></a><span class="TextRun SCXW259565000 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW259565000 BCX0"> means </span></span><span class="TextRun SCXW259565000 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW259565000 BCX0">your new chats </span><span class="NormalTextRun SCXW259565000 BCX0">won’t</span><span class="NormalTextRun SCXW259565000 BCX0"> be used to improve the</span><span class="NormalTextRun SCXW259565000 BCX0">ir</span> <span class="NormalTextRun SCXW259565000 BCX0">machine learning services</span></span><span class="TextRun SCXW259565000 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW259565000 BCX0">, nor will they be seen by human reviewers, </span><span class="NormalTextRun SCXW259565000 BCX0">unless</span><span class="NormalTextRun SCXW259565000 BCX0"> you explicitly </span><span class="NormalTextRun SCXW259565000 BCX0">submit</span><span class="NormalTextRun SCXW259565000 BCX0"> them as feedback. This gives regular us</span><span class="NormalTextRun SCXW259565000 BCX0">ers a way </span><span class="NormalTextRun SCXW259565000 BCX0">to opt out, </span><span class="NormalTextRun SCXW259565000 BCX0">similar to</span><span class="NormalTextRun SCXW259565000 BCX0"> ChatGPT’s opt-out toggle.</span></span><span class="EOP SCXW259565000 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-cb94ad1 elementor-widget elementor-widget-image" data-id="cb94ad1" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7901" data-permalink="https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/image-1/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/image-1.png" data-orig-size="712,332" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="image (1)" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/image-1-300x140.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/image-1.png" tabindex="0" role="button" width="712" height="332" src="https://inero-software.com/wp-content/uploads/2025/04/image-1.png" class="attachment-large size-large wp-image-7901" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/04/image-1.png 712w, https://inero-software.com/wp-content/uploads/2025/04/image-1-300x140.png 300w, https://inero-software.com/wp-content/uploads/2025/04/image-1-643x300.png 643w" sizes="(max-width: 712px) 100vw, 712px" data-attachment-id="7901" data-permalink="https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/image-1/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/image-1.png" data-orig-size="712,332" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="image (1)" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/image-1-300x140.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/image-1.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-e57f550 elementor-widget elementor-widget-text-editor" data-id="e57f550" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW161006688 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW161006688 BCX0">To stop saving your conversations, go to the </span></span><span class="TextRun SCXW161006688 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW161006688 BCX0">Activity </span></span><span class="TextRun SCXW161006688 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW161006688 BCX0">tab and toggle </span></span><span class="TextRun SCXW161006688 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW161006688 BCX0">Gemini Apps Activity</span></span><span class="TextRun SCXW161006688 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW161006688 BCX0">. </span><span class="NormalTextRun SCXW161006688 BCX0">You can also </span><span class="NormalTextRun SCXW161006688 BCX0">delete</span><span class="NormalTextRun SCXW161006688 BCX0"> your past conversations.</span></span><span class="EOP SCXW161006688 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-ca02a5a elementor-widget elementor-widget-heading" data-id="ca02a5a" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h5 class="elementor-heading-title elementor-size-default">API and Vertex AI </h5>		</div>
				</div>
				<div class="elementor-element elementor-element-73c636b elementor-widget elementor-widget-text-editor" data-id="73c636b" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW147481227 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW147481227 BCX0">If </span><span class="NormalTextRun SCXW147481227 BCX0">you’re</span><span class="NormalTextRun SCXW147481227 BCX0"> using Google Cloud’s </span></span><span class="TextRun SCXW147481227 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW147481227 BCX0">Vertex AI</span></span><span class="TextRun SCXW147481227 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW147481227 BCX0"> platform:</span></span><span class="EOP SCXW147481227 BCX0" data-ccp-props="{}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-5da483c elementor-widget elementor-widget-text-editor" data-id="5da483c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="5" data-aria-level="1"><span data-contrast="auto">Your prompts and outputs are </span><strong>not used to train AI models</strong><span data-contrast="auto"> without explicit permission.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="6" data-aria-level="1"><span data-contrast="auto">Data may be cached briefly (up to 24 hours) for performance but remains within your selected geographic region.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="7" data-aria-level="1"><span data-contrast="auto">Businesses can opt for a </span><strong>zero-retention policy</strong><span data-contrast="auto"> for maximum privacy.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-15e5fa7 elementor-widget elementor-widget-heading" data-id="15e5fa7" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h5 class="elementor-heading-title elementor-size-default">Data residency  </h5>		</div>
				</div>
				<div class="elementor-element elementor-element-6769505 elementor-widget elementor-widget-text-editor" data-id="6769505" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW242043066 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW242043066 BCX0">Data residency is a strong point for Google: you can choose which geographic region your AI service runs in (e.g. </span><span class="NormalTextRun SCXW242043066 BCX0">EU or U</span><span class="NormalTextRun SCXW242043066 BCX0">S data </span><span class="NormalTextRun SpellingErrorV2Themed SCXW242043066 BCX0">centers</span><span class="NormalTextRun SCXW242043066 BCX0">), and Google will process and store data in that region to meet any data localization requirements.</span></span><span class="EOP SCXW242043066 BCX0" data-ccp-props="{}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-dffefeb elementor-widget elementor-widget-spacer" data-id="dffefeb" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-e7c3b12 elementor-widget elementor-widget-heading" data-id="e7c3b12" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Microsoft Azure OpenAI – Enterprise Data Protection by Design </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-36c3a52 elementor-widget elementor-widget-heading" data-id="36c3a52" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h5 class="elementor-heading-title elementor-size-default">Training Policy </h5>		</div>
				</div>
				<div class="elementor-element elementor-element-657a095 elementor-widget elementor-widget-text-editor" data-id="657a095" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="auto">Microsoft’s Azure OpenAI Service lets companies use OpenAI’s models through the trusted Azure cloud platform. </span><strong>Privacy is a major selling point here</strong><span data-contrast="auto"><strong>.</strong> Microsoft is very explicit: </span><strong>any data you send into Azure OpenAI is not used to train the underlying models</strong><span data-contrast="auto"> or improve Microsoft’s or OpenAI’s services</span><span data-ccp-props="{&quot;134245418&quot;:true,&quot;134245529&quot;:true}"> .</span></p><p><span data-ccp-props="{&quot;134245418&quot;:true,&quot;134245529&quot;:true}"> </span></p><p><span data-contrast="none">Microsoft’s Azure OpenAI Service essentially hosts OpenAI’s models (GPT-4, GPT-3.5, etc.) within the Microsoft Azure cloud. Microsoft has specifically designed this service for enterprises that require strong privacy protections. Key aspects are:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-96820b8 elementor-widget elementor-widget-text-editor" data-id="96820b8" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><span data-contrast="none">Any data you input into Azure OpenAI – prompts, completions (model outputs), embeddings, fine-tuning data – is not used to train the AI models. </span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><span data-contrast="none">Your inputs and outputs “are NOT available to other customers, are NOT available to OpenAI, and are NOT used to improve OpenAI models”. </span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><span data-contrast="none">Microsoft only retains data as needed to provide the service and monitor for misuse. In fact, prompts and outputs on Azure are stored only temporarily (up to 30 days) by default, and solely for abuse detection purposes. After 30 days, those prompts are deleted. If even this temporary storage is a concern (say, for ultra-sensitive data), Microsoft offers a process called “modified abuse monitoring” where you can request that even the 30-day storage be bypassed, meaning no prompts are retained at all. Typically, you’d need approval for this exception, but it’s an option for high-security scenarios.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-5e2b615 elementor-widget elementor-widget-heading" data-id="5e2b615" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h5 class="elementor-heading-title elementor-size-default">Data Residency </h5>		</div>
				</div>
				<div class="elementor-element elementor-element-82ccf7d elementor-widget elementor-widget-text-editor" data-id="82ccf7d" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW93588553 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW93588553 BCX0">Because </span><span class="NormalTextRun SCXW93588553 BCX0">it’s</span><span class="NormalTextRun SCXW93588553 BCX0"> on Azure, you also </span><span class="NormalTextRun SCXW93588553 BCX0">benefit</span><span class="NormalTextRun SCXW93588553 BCX0"> from easily choosing the region and </span><span class="NormalTextRun SCXW93588553 BCX0">complying with</span><span class="NormalTextRun SCXW93588553 BCX0"> data residency requirements. When setting up Azure OpenAI, you deploy the service to an Azure region (for example, East US, West Europe, Southeast Asia, etc.). All processing and data storage for inference will occur within that region or its geographical boundary. So, if you deploy in Western Europe, your data </span><span class="NormalTextRun SCXW93588553 BCX0">isn’t</span><span class="NormalTextRun SCXW93588553 BCX0"> leaving Europe </span><span class="NormalTextRun SCXW93588553 BCX0">&#8211;</span><span class="NormalTextRun SCXW93588553 BCX0"> crucial for GDPR compliance. Azure itself meets </span><span class="NormalTextRun SCXW93588553 BCX0">numerous</span><span class="NormalTextRun SCXW93588553 BCX0"> compliance standards (SOC 2, ISO 27001, </span><span class="NormalTextRun SCXW93588553 BCX0">etc.)</span><span class="NormalTextRun SCXW93588553 BCX0">, and these extend to Azure OpenAI as an Azure service.</span></span><span class="EOP SCXW93588553 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-cea2902 elementor-widget elementor-widget-spacer" data-id="cea2902" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-0013609 elementor-widget elementor-widget-heading" data-id="0013609" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Anthropic (Claude) – A Privacy-First AI Assistant </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-6f1b8b4 elementor-widget elementor-widget-heading" data-id="6f1b8b4" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h5 class="elementor-heading-title elementor-size-default">Training Policy </h5>		</div>
				</div>
				<div class="elementor-element elementor-element-988001e elementor-widget elementor-widget-text-editor" data-id="988001e" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW126360551 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW126360551 BCX0">Anthropic, the company behind the Claude AI assistant (Claude 2 and newer versions), has emphasized a privacy-conscious approach from the outset. </span><span class="NormalTextRun SCXW126360551 BCX0">Anthropic adopts an opt-in approach:</span></span><span class="EOP SCXW126360551 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-3f7e219 elementor-widget elementor-widget-text-editor" data-id="3f7e219" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="7" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><span data-contrast="none">By default, Anthropic does not use your conversations or data to train its models. This applies to both their commercial offerings (</span><a href="https://privacy.anthropic.com/en/collections/10663361-commercial-customers"><span data-contrast="none">Claude for Work, Anthropic API</span></a><span data-contrast="none">)</span> <span data-contrast="none">and consumer products (Claude Free, Claude Pro)</span> <span data-contrast="none">– your prompts and Claude’s responses aren’t automatically used for model training. </span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="7" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><span data-contrast="none">They only use data if you deliberately opt-in, such as by providing explicit feedback. For instance, if you click a thumbs-up/down in a Claude interface or send data to their feedback channels, you’re essentially saying “you can learn from this”.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-00d6994 elementor-widget elementor-widget-text-editor" data-id="00d6994" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW11925797 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW11925797 BCX0">For enterprise clients, Anthropic offers Claude Team/Enterprise, which not only guarantees no training on your data but also provides admin controls. One such feature is custom data retention settings. By default, Anthropic’s systems might </span><span class="NormalTextRun SCXW11925797 BCX0">retain</span><span class="NormalTextRun SCXW11925797 BCX0"> your inputs/outputs indefinitely for your account (though not for training). However, Claude Enterprise admins can set a retention policy – for example, you might set it to </span><span class="NormalTextRun SCXW11925797 BCX0">delete</span><span class="NormalTextRun SCXW11925797 BCX0"> all conversation data after 30 days, 60 days, etc., with 30 days being the current minimum. These controls aim to support compliance with regulations like GDPR.</span></span><span class="EOP SCXW11925797 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-5a24ccc elementor-widget elementor-widget-heading" data-id="5a24ccc" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h5 class="elementor-heading-title elementor-size-default">Data Residency  </h5>		</div>
				</div>
				<div class="elementor-element elementor-element-3cf1dac elementor-widget elementor-widget-text-editor" data-id="3cf1dac" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW47979688 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW47979688 BCX0">Anthropic is a newer player, and currently, when you use their API directly, you </span><span class="NormalTextRun SCXW47979688 BCX0">don’t</span><span class="NormalTextRun SCXW47979688 BCX0"> explicitly choose a data region – </span><span class="NormalTextRun SCXW47979688 BCX0">it’s</span> <span class="NormalTextRun SCXW47979688 BCX0">likely hosted</span><span class="NormalTextRun SCXW47979688 BCX0"> in the US by Anthropic (or </span><span class="NormalTextRun SCXW47979688 BCX0">possibly through</span><span class="NormalTextRun SCXW47979688 BCX0"> cloud providers like AWS in the US region). However, Anthropic models are also available through partners, which can help with data residency. For example, Anthropic’s Claude is offered via Amazon Bedrock (AWS’s AI service) and via Google Cloud Vertex AI. If you use Claude through one of these platforms, you can take advantage of AWS’s or Google’s region controls.</span></span><span class="EOP SCXW47979688 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-a2a60c8 elementor-widget elementor-widget-spacer" data-id="a2a60c8" data-element_type="widget" data-widget_type="spacer.default">
				<div class="elementor-widget-container">
					<div class="elementor-spacer">
			<div class="elementor-spacer-inner"></div>
		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-de688f7 elementor-widget elementor-widget-heading" data-id="de688f7" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Conclusion </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-9f1b51c elementor-widget elementor-widget-text-editor" data-id="9f1b51c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="auto">Understanding the </span><strong>data collection practices of LLM providers</strong><span data-contrast="auto"> is crucial for<b> </b></span><strong>AI compliance</strong><span data-contrast="auto">, customer trust, and corporate governance. Whether you&#8217;re focused on compliance, customer trust, or internal data governance, these insights help you make informed decisions. Choose providers that align with your privacy values &#8211; and always review your settings.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><p><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><p><span data-contrast="auto">Here&#8217;s a comparison of major platforms:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-4597621 elementor-widget elementor-widget-html" data-id="4597621" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			<style>
  table {
    width: 100%;
    border-collapse: collapse;
    font-family: 'Roboto', sans-serif;
    font-weight: 300;
    font-size: 14px;
    color: #1C244B;
  }
  th, td {
    border: 1px solid #ccc;
    padding: 8px;
    text-align: left;
    vertical-align: top;
  }
  th {
    background-color: #f2f2f2;
  }
  a {
    color: #1C244B;
    text-decoration: underline;
  }
</style>

<table>
  <thead>
    <tr>
      <th>Provider</th>
      <th>Default Data Training</th>
      <th>Web App Setting</th>
      <th>Data Residency Options</th>
      <th>GDPR/CCPA Compliance</th>
      <th>Privacy Policy</th>
    </tr>
  </thead>
  <tbody>
    <tr>
      <td>OpenAI</td>
      <td>No (API)</td>
      <td>Opt-out available</td>
      <td>No; (unless used via Azure Microsoft)</td>
      <td>Yes</td>
      <td><a href="https://openai.com/policies/privacy-policy" target="_blank">Consumer privacy</a></td>
    </tr>
    <tr>
      <td>Google</td>
      <td>No (Cloud + Gemini)</td>
      <td>No training by default</td>
      <td>Broad region control</td>
      <td>Yes</td>
      <td>
        <a href="https://policies.google.com/privacy" target="_blank">Enterprise privacy</a>, 
        <a href="https://www.google.com/intl/en_us/gemini/privacy" target="_blank">Gemini privacy</a>, 
        <a href="https://cloud.google.com/vertex-ai/docs/general/privacy-overview" target="_blank">Vertex AI</a>
      </td>
    </tr>
    <tr>
      <td>Azure</td>
      <td>No</td>
      <td>N/A</td>
      <td>Full regional control</td>
      <td>Yes</td>
      <td><a href="https://privacy.microsoft.com/en-us/privacystatement" target="_blank">Azure, OpenAI privacy</a></td>
    </tr>
    <tr>
      <td>Anthropic</td>
      <td>No</td>
      <td>No training by default</td>
      <td>No (unless used via partners)</td>
      <td>Yes</td>
      <td>
        <a href="https://www.anthropic.com/legal/privacy" target="_blank">API users</a>, 
        <a href="https://claude.ai/privacy" target="_blank">Claude.ai users</a>
      </td>
    </tr>
  </tbody>
</table>
		</div>
				</div>
				<div class="elementor-element elementor-element-5234314 elementor-widget elementor-widget-text-editor" data-id="5234314" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW227920897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW227920897 BCX0">For maximum privacy and control, </span></span><span class="TextRun SCXW227920897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW227920897 BCX0"><b>local deployment</b></span></span><span class="TextRun SCXW227920897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW227920897 BCX0"><b> </b>(on-premises models) is always an alternative. This avoids cloud storage concerns entirely.</span><span class="NormalTextRun SCXW227920897 BCX0"> You can read more about local deployment </span></span><a class="Hyperlink SCXW227920897 BCX0" href="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/" target="_blank" rel="noreferrer noopener"><span class="TextRun Underlined SCXW227920897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW227920897 BCX0" data-ccp-charstyle="Hyperlink">here</span></span></a><span class="TextRun SCXW227920897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW227920897 BCX0">.</span></span><span class="EOP SCXW227920897 BCX0" data-ccp-props="{}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-7c7244d elementor-cta--skin-cover elementor-animated-content elementor-bg-transform elementor-bg-transform-zoom-in elementor-widget elementor-widget-call-to-action" data-id="7c7244d" data-element_type="widget" data-widget_type="call-to-action.default">
				<div class="elementor-widget-container">
					<div class="elementor-cta">
					<div class="elementor-cta__bg-wrapper">
				<div class="elementor-cta__bg elementor-bg" style="background-image: url(https://inero-software.com/wp-content/uploads/2025/03/cta-1903-1030x579.png);" role="img" aria-label="cta 1903"></div>
				<div class="elementor-cta__bg-overlay"></div>
			</div>
							<div class="elementor-cta__content">
				
									<h2 class="elementor-cta__title elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						Let's talk about AI agents 					</h2>
				
									<div class="elementor-cta__description elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						Ready to bring AI into your business? Let us help you get started.					</div>
				
									<div class="elementor-cta__button-wrapper elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
					<a class="elementor-cta__button elementor-button elementor-size-" href="https://inero-software.com/contact-us/">
						Contact us					</a>
					</div>
							</div>
						</div>
				</div>
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/ai-user-privacy-an-analysis-of-platform-policies/">AI User Privacy: An Analysis of Platform Policies</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">7890</post-id>	</item>
		<item>
		<title>Top Lightweight LLMs for Local Deployment</title>
		<link>https://inero-software.com/top-lightweight-llms-for-local-deployment/</link>
		
		<dc:creator><![CDATA[Martyna Mul]]></dc:creator>
		<pubDate>Thu, 17 Apr 2025 09:50:46 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Blog]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[AI development]]></category>
		<category><![CDATA[Artificial Intelligence]]></category>
		<category><![CDATA[Large Language Model]]></category>
		<category><![CDATA[Lightweight LLMs]]></category>
		<category><![CDATA[LLM]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=7843</guid>

					<description><![CDATA[<p>In this post, we’ll explore several top open-source lightweight LLMs and how to run them on a local Windows PC—whether CPU-only or with a limited GPU—for document processing tasks. </p>
<p>Artykuł <a href="https://inero-software.com/top-lightweight-llms-for-local-deployment/">Top Lightweight LLMs for Local Deployment</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="7843" class="elementor elementor-7843" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-cc31ada e-flex e-con-boxed e-con e-parent" data-id="cc31ada" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-2485c29 elementor-widget elementor-widget-html" data-id="2485c29" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
					</div>
				</div>
				<div class="elementor-element elementor-element-d3520b4 elementor-widget elementor-widget-text-editor" data-id="d3520b4" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h5><strong><span class="TrackedChange SCXW35608661 BCX0"><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun TrackChangeDeleteHighlight SCXW35608661 BCX0">Running large language models (LLMs) on your own hardware has become increasingly </span></span></span><span class="TrackedChange SCXW35608661 BCX0"><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun TrackChangeDeleteHighlight SCXW35608661 BCX0">feasible</span></span></span><span class="TrackedChange SCXW35608661 BCX0"><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun TrackChangeDeleteHighlight SCXW35608661 BCX0"> thanks to </span></span></span><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW35608661 BCX0">lightweight LLMs</span><span class="NormalTextRun SCXW35608661 BCX0">—models w</span><span class="NormalTextRun SCXW35608661 BCX0">ith</span> <span class="NormalTextRun SCXW35608661 BCX0">relatively small</span><span class="NormalTextRun SCXW35608661 BCX0"> parameter counts that deliver </span><span class="NormalTextRun SCXW35608661 BCX0">strong performance</span><span class="NormalTextRun SCXW35608661 BCX0"> without requiring server-grade GPUs.</span><span class="NormalTextRun SCXW35608661 BCX0"> In this post, </span><span class="NormalTextRun SCXW35608661 BCX0">we’ll</span><span class="NormalTextRun SCXW35608661 BCX0"> explore several top open-source lightweight LLMs and how to run them on a local Windows PC—whether CPU-only or with a limited GPU—for document processing tasks.</span> </span><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW35608661 BCX0">We also include a </span></span><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW35608661 BCX0">benchmark comparing the models</span></span><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW35608661 BCX0"> in terms of </span></span><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW35608661 BCX0">accuracy and inference speed</span></span><span class="TextRun SCXW35608661 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW35608661 BCX0">, helping you choose the right model for your local environment and use case.</span></span><span class="EOP SCXW35608661 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:299,&quot;335559739&quot;:299}"> </span></strong></h5>						</div>
				</div>
				<div class="elementor-element elementor-element-10359f9 elementor-widget elementor-widget-heading" data-id="10359f9" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">What Are Lightweight LLMs (and Why Run Them Locally)? </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-621d40f elementor-widget elementor-widget-text-editor" data-id="621d40f" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW177302101 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW177302101 BCX0">“Lightweight” LLMs are models typically in the range of ~1–8 billion parameters – far smaller than GPT-3 class models – often optimized to run on a single GPU or even CPU. They are usually released as open models with freely available weights. These models trade some raw power for efficiency, but recent research and clever engineering (better data, distilled training, efficient attention mechanisms, etc.) have dramatically improved their capabilities. Many can now match or beat much larger models on specific benchmarks</span><span class="NormalTextRun SCXW177302101 BCX0">.</span></span><span class="EOP SCXW177302101 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-81497fe elementor-widget elementor-widget-text-editor" data-id="81497fe" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="auto">Local deployment of such models is valuable for several reasons:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><strong>Privacy &amp; Security:</strong><span data-contrast="auto"> All data stays on your machine, which is crucial for confidential documents like insurance contracts. You’re not sending sensitive text to a third-party API.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><strong>Cost Savings:</strong><span data-contrast="auto"> Once downloaded, local models run </span><strong>for free</strong><span data-contrast="auto"> – no API usage fees or cloud compute bills. This can make a big difference if you process large volumes of documents regularly.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><strong>Latency &amp; Offline Access:</strong><span data-contrast="auto"> Local inference eliminates network latency. Responses can be near-instant on a GPU, and you can operate entirely offline. This is useful for on-site workflows or when internet access is restricted.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><strong>Customization:</strong><span data-contrast="auto"> With local models you have full control – you can adjust parameters, prompts, or fine-tune models to better fit your domain (e.g. insurance data) without vendor limits.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><p><span data-contrast="auto">In short, lightweight LLMs put AI capabilities directly in your hands, on hardware you own. Next, we’ll compare some of the leading open models that are well-suited for local document processing.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-6e958d1 elementor-widget elementor-widget-heading" data-id="6e958d1" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Comparing Top Lightweight LLMs </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-adbf2c8 elementor-widget elementor-widget-text-editor" data-id="adbf2c8" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW101152181 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW101152181 BCX0">Lightweight open-source large language models (LLMs) are becoming a practical choice for organizations looking to run AI workloads locally. They offer a strong balance between performance, speed, and resource requirements—making them ideal for document summarization, extraction, and classification without relying on cloud infrastructure. </span></span><span class="EOP SCXW101152181 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-330c9fe e-flex e-con-boxed e-con e-parent" data-id="330c9fe" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-73949bc elementor-widget elementor-widget-text-editor" data-id="73949bc" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="auto">We’ll focus on the following open-source models (each with downloadable checkpoints) that have a good reputation for quality relative to their size:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-6703794 elementor-widget elementor-widget-text-editor" data-id="6703794" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><strong>Llama 3.1</strong><span data-contrast="auto"> – 8B parameters (Meta AI)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li><li data-leveltext="-" data-font="Aptos" data-listid="2" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><strong>StableLM Zephyr</strong><span data-contrast="auto"> – 3B parameters (Stability AI)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="2" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><strong>Llama 3.2</strong><span data-contrast="auto"> – 1B/3B parameters (Meta AI)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="2" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><strong>Mistral</strong><span data-contrast="auto"> – 7B parameters (Mistral AI)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="2" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="5" data-aria-level="1"><strong>Gemma 3</strong><span data-contrast="auto"> – 1B and 4B variants (Google DeepMind)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="2" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="6" data-aria-level="1"><strong>DeepSeek R1</strong><span data-contrast="auto"> – 1.5B and 7B variants (DeepSeek AI)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="2" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="7" data-aria-level="1"><strong>Phi-4 Mini</strong><span data-contrast="auto"> – 3.8B parameters (Microsoft)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="2" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="8" data-aria-level="1"><strong>TinyLlama</strong><span data-contrast="auto"> – 1.1B parameters (community project)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-f98ca55 elementor-widget elementor-widget-text-editor" data-id="f98ca55" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><span data-contrast="auto">These models range from very small (under 1 GB on disk) to mid-sized (~5 GB). All can be run in inference mode on a 16 GB GPU (often even in half-precision or 4-bit quantized form) and many are workable on CPU with enough RAM and patience. Table 1 summarizes their characteristics:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-71cd074 elementor-widget elementor-widget-html" data-id="71cd074" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			<style>
  @import url('https://fonts.googleapis.com/css2?family=Roboto:wght@300&display=swap');

  .model-table {
    font-family: 'Roboto', sans-serif;
    font-weight: 300;
    font-size: 14px;
    color: #1C244B;
    border-collapse: collapse;
    width: 100%;
  }

  .model-table th, .model-table td {
    border: 1px solid #ccc;
    padding: 8px;
    text-align: left;
    color: #1C244B;
  }

  .model-table th {
    background-color: #f2f2f2;
  }
</style>

<table class="model-table">
  <thead>
    <tr>
      <th>Model</th>
      <th>Size on Disk (quantized)</th>
      <th>Max Context</th>
      <th>Licence</th>
    </tr>
  </thead>
  <tbody>
    <tr>
      <td>Llama 3.1 (8B)</td>
      <td>4.9GB</td>
      <td>128k tokens</td>
      <td>Open-source</td>
    </tr>
    <tr>
      <td>StableLM Zephyr (3B)</td>
      <td>1.6GB</td>
      <td>4k tokens</td>
      <td>Only non-commercial use</td>
    </tr>
    <tr>
      <td>Llama 3.2 (3B)</td>
      <td>2.0GB</td>
      <td>128k tokens</td>
      <td>Open-source</td>
    </tr>
    <tr>
      <td>Mistral (7B)</td>
      <td>4.1GB</td>
      <td>32k tokens</td>
      <td>Open-source (Apache 2.0)</td>
    </tr>
    <tr>
      <td>Gemma 3 (4B)</td>
      <td>3.3GB</td>
      <td>128k tokens</td>
      <td>Open-source</td>
    </tr>
    <tr>
      <td>Gemma 3 (1B)</td>
      <td>0.8GB</td>
      <td>32k tokens</td>
      <td>Open-source</td>
    </tr>
    <tr>
      <td>DeepSeek R1 (7B)</td>
      <td>4.7GB</td>
      <td>128k tokens</td>
      <td>Open-source (MIT licence)</td>
    </tr>
    <tr>
      <td>DeepSeek R1 (1.5B)</td>
      <td>1.1GB</td>
      <td>128k tokens</td>
      <td>Open-source (MIT licence)</td>
    </tr>
    <tr>
      <td>Phi-4 Mini (3.8B)</td>
      <td>2.5GB</td>
      <td>128k tokens</td>
      <td>Open-source</td>
    </tr>
    <tr>
      <td>TinyLlama (1.1B)</td>
      <td>0.6GB</td>
      <td>2k tokens</td>
      <td>Open-source</td>
    </tr>
  </tbody>
</table>
		</div>
				</div>
				<div class="elementor-element elementor-element-55c06b4 elementor-widget elementor-widget-text-editor" data-id="55c06b4" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h6><span class="TextRun SCXW254867370 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW254867370 BCX0">Table 1:</span></span><span class="TextRun SCXW254867370 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW254867370 BCX0"> Lightweight LLMs for local use – model sizes a</span><span class="NormalTextRun SCXW254867370 BCX0">nd</span> <span class="NormalTextRun SCXW254867370 BCX0">maximum</span><span class="NormalTextRun SCXW254867370 BCX0"> context windo</span><span class="NormalTextRun SCXW254867370 BCX0">w</span><span class="NormalTextRun SCXW254867370 BCX0">.</span></span><span class="EOP SCXW254867370 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></h6>						</div>
				</div>
				<div class="elementor-element elementor-element-58e51e9 elementor-widget elementor-widget-text-editor" data-id="58e51e9" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong><span class="TextRun SCXW7653520 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW7653520 BCX0">Notes:</span></span></strong><span class="TextRun SCXW7653520 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW7653520 BCX0"> “Max Context” is the maximum sequence length (tokens) the model can process in one go. </span></span><span class="EOP SCXW7653520 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-223eda5 elementor-widget elementor-widget-text-editor" data-id="223eda5" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW99345828 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW99345828 BCX0">Next, </span><span class="NormalTextRun SCXW99345828 BCX0">let’s</span><span class="NormalTextRun SCXW99345828 BCX0"> look at each model’s </span></span><span class="TextRun SCXW99345828 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW99345828 BCX0">pros and cons</span></span><span class="TextRun SCXW99345828 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW99345828 BCX0">, especially in the context of document tasks:</span></span><span class="EOP SCXW99345828 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-7192f01 elementor-widget elementor-widget-text-editor" data-id="7192f01" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><strong>Llama 3.1 (8B)</strong><span data-contrast="auto"><strong>:</strong> Powerful general-purpose model; moderate size and strong multilingual capabilities. Heavy for CPU-only systems; requires chunking for long documents.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><strong>StableLM Zephyr (3B)</strong><span data-contrast="auto"><strong>:</strong> Ultra-lightweight, good for basic QA/extraction. Limited by small parameter count and commercial license restrictions.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><strong>Llama 3.2 (3B)</strong><span data-contrast="auto">: Excellent summarization and retrieval; long context support (128k tokens). Smaller size affects complex reasoning accuracy.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><strong>Mistral (7B)</strong><span data-contrast="auto"><strong>:</strong> Best overall performer for its size; highly efficient inference. Ideal for detailed summarization tasks.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="5" data-aria-level="1"><strong>Gemma 3 (4B/1B)</strong><span data-contrast="auto">: Offers multimodal capabilities and extensive multilingual support. The 4B model balances capability and speed; the 1B model best suited for simple tasks.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="6" data-aria-level="1"><strong>DeepSeek R1 (7B/1.5B)</strong><span data-contrast="auto">: Balanced efficiency and comprehension for general NLP tasks; limited complex reasoning compared to Mistral.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="7" data-aria-level="1"><strong>Phi-4 Mini (3.8B)</strong><span data-contrast="auto">: Exceptional reasoning, math, and logical capabilities; perfect for analytical document processing. English-focused.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="3" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:1080,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="8" data-aria-level="1"><strong>TinyLlama (1.1B)</strong><span data-contrast="auto">: Extremely lightweight; suitable for basic text extraction/classification tasks. Limited contextual understanding.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-906c9d8 elementor-widget elementor-widget-text-editor" data-id="906c9d8" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW259074413 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW259074413 BCX0">The models reviewed above cover a wide range of sizes and capabilities. Larger variants like Llama 3.1 and Mistral perform well on complex summarization and multilingual tasks but are less suited for CPU-only setups. Mid-sized models such as Llama 3.2 and Gemma 3 (4B) handle long inputs efficiently with reasonable performance. Smaller models, including </span><span class="NormalTextRun SpellingErrorV2Themed SCXW259074413 BCX0">TinyLlama</span><span class="NormalTextRun SCXW259074413 BCX0"> and </span><span class="NormalTextRun SpellingErrorV2Themed SCXW259074413 BCX0">StableLM</span><span class="NormalTextRun SCXW259074413 BCX0"> Zephyr, are lightweight and fast, making them practical for basic extraction or classification tasks.</span></span><span class="EOP SCXW259074413 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-013ecbc elementor-widget elementor-widget-heading" data-id="013ecbc" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Models Benchmarking: Document Extraction and Summarization </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-f583b4c elementor-widget elementor-widget-text-editor" data-id="f583b4c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW65580225 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW65580225 BCX0">Here we outline a simple </span><span class="NormalTextRun SCXW65580225 BCX0">model </span><span class="NormalTextRun SCXW65580225 BCX0">benchmarking plan covering t</span><span class="NormalTextRun SCXW65580225 BCX0">wo</span><span class="NormalTextRun SCXW65580225 BCX0"> common document-processing tasks:</span></span><span class="EOP SCXW65580225 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-236155a elementor-widget elementor-widget-text-editor" data-id="236155a" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ol><li><strong> Information Extraction:</strong><span data-contrast="auto"> We evaluated how well each model can extract specific fields from a policy or certificate. Specifically, we prompted each model to find the </span><b><span data-contrast="auto">p</span></b><strong>olicy number, insured name</strong><span data-contrast="auto"><strong>,</strong> VAT ID, address and insurance period in the document text and return the structured output &#8211; clean JSON response with all the needed values.</span></li><li><strong> Summarization: </strong><span data-contrast="auto">Each model generated a concise summary of an insurance policy, covering key points such as coverage, exclusions, and conditions.We rated the summaries on clarity, correctness, factual accuracy and readability and penalized heavily fabricating information.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ol>						</div>
				</div>
				<div class="elementor-element elementor-element-02421da elementor-widget elementor-widget-text-editor" data-id="02421da" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun CommentStart SCXW43958002 BCX0">We used 11 document</span><span class="NormalTextRun SCXW43958002 BCX0">s</span><span class="NormalTextRun SCXW43958002 BCX0"> and</span><span class="NormalTextRun SCXW43958002 BCX0"> </span><span class="NormalTextRun SCXW43958002 BCX0">ran all t</span><span class="NormalTextRun SCXW43958002 BCX0">ests using </span></span><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SpellingErrorV2Themed SCXW43958002 BCX0">Ollama</span></span><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW43958002 BCX0"> <a href="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/">(</a></span><span class="NormalTextRun SCXW43958002 BCX0">you can read about </span><span class="NormalTextRun SCXW43958002 BCX0">running model with </span><span class="NormalTextRun SpellingErrorV2Themed SCXW43958002 BCX0">Ollama</span> <span class="NormalTextRun CommentStart SCXW43958002 BCX0">here</span><span class="NormalTextRun SCXW43958002 BCX0">)</span><span class="NormalTextRun SCXW43958002 BCX0">.</span><span class="NormalTextRun SCXW43958002 BCX0"> </span><span class="NormalTextRun SCXW43958002 BCX0">The benchmarks were performed on a PC equipped with an</span><span class="NormalTextRun SCXW43958002 BCX0"> NVIDIA </span><span class="NormalTextRun SCXW43958002 BCX0">GeForce RTX 2060 </span><span class="NormalTextRun SCXW43958002 BCX0">and </span><span class="NormalTextRun SCXW43958002 BCX0">6</span><span class="NormalTextRun SCXW43958002 BCX0"> GB </span><span class="NormalTextRun SCXW43958002 BCX0">V</span><span class="NormalTextRun SCXW43958002 BCX0">RAM.</span> <span class="NormalTextRun SCXW43958002 BCX0">To ensure consistent results, each model was run with </span></span><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW43958002 BCX0">temperature set to 0</span></span><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW43958002 BCX0"> for the extraction task (to produce deterministic outputs), and with a fixed </span></span><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW43958002 BCX0">temperature of 0.7</span></span><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW43958002 BCX0"> for summarization. For the extraction task, we also used </span></span><a class="Hyperlink SCXW43958002 BCX0" href="https://ollama.com/blog/structured-outputs" target="_blank" rel="noreferrer noopener"><span class="TextRun Underlined SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW43958002 BCX0" data-ccp-charstyle="Hyperlink">structured outputs</span></span></a><span class="TextRun SCXW43958002 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW43958002 BCX0">:</span> </span><span class="EOP SCXW43958002 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;201341983&quot;:0,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335557856&quot;:16777215,&quot;335559738&quot;:0,&quot;335559739&quot;:0,&quot;335559740&quot;:270}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-f1a279a elementor-widget elementor-widget-text-editor" data-id="f1a279a" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre> <br /><br /><span data-contrast="none">{</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"model"</span><span data-contrast="none">: </span><span data-contrast="none">"deepseek-r1:7b"</span><span data-contrast="none">,</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"prompt"</span><span data-contrast="none">: </span><span data-contrast="none">"You are an assistant that extracts insurance-related information from a given input text. You must extract and return only the following fields: - policy_number,- insurance_period,- insured (company or person name),- nip (tax identification number),- address (of the insured). Return the output as a **clean JSON object** — not as a string, not inside quotes, and without any commentary. If a field is missing, use 'Not found'. Document text: "</span><span data-contrast="none">,</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;201341983&quot;:0,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335557856&quot;:16777215,&quot;335559738&quot;:0,&quot;335559739&quot;:0,&quot;335559740&quot;:270}"> </span><br /><br /><span data-contrast="none">    </span><span data-contrast="none">"stream"</span><span data-contrast="none">: </span><b><span data-contrast="none">false</span></b><span data-contrast="none">,</span> <br /><span data-contrast="none">    </span><span data-contrast="none">"format"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">    </span><span data-contrast="none">"type"</span><span data-contrast="none">: </span><span data-contrast="none">"object"</span><span data-contrast="none">,</span> <br /><span data-contrast="none">    </span><span data-contrast="none">"properties"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"policy_number"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"type"</span><span data-contrast="none">: </span><span data-contrast="none">"string"</span> <br /><span data-contrast="none">      },</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insurance_period_start"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"type"</span><span data-contrast="none">: </span><span data-contrast="none">"string"</span> <br /><span data-contrast="none">      },</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insurance_period_end"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"type"</span><span data-contrast="none">: </span><span data-contrast="none">"string"</span> <br /><span data-contrast="none">      },</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insured"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"type"</span><span data-contrast="none">: </span><span data-contrast="none">"string"</span> <br /><span data-contrast="none">      },</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insured_nip"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"type"</span><span data-contrast="none">: </span><span data-contrast="none">"string"</span> <br /><span data-contrast="none">      },</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insured_address"</span><span data-contrast="none">: {</span> <br /><span data-contrast="none">        </span><span data-contrast="none">"type"</span><span data-contrast="none">: </span><span data-contrast="none">"string"</span> <br /><span data-contrast="none">      }</span> <br /><span data-contrast="none">    },</span> <br /><span data-contrast="none">    </span><span data-contrast="none">"required"</span><span data-contrast="none">: [</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"policy_number"</span><span data-contrast="none">,</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insurance_period_start"</span><span data-contrast="none">, </span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insurance_period_end"</span><span data-contrast="none">,</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insured"</span><span data-contrast="none">,</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insured_nip"</span><span data-contrast="none">,</span> <br /><span data-contrast="none">      </span><span data-contrast="none">"insured_address"</span> <br /><span data-contrast="none">    ]</span> <br /><span data-contrast="none">  }</span> <br /><span data-contrast="none">}</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;201341983&quot;:0,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335557856&quot;:16777215,&quot;335559738&quot;:0,&quot;335559739&quot;:0,&quot;335559740&quot;:270}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-a6fbca0 elementor-widget elementor-widget-image" data-id="a6fbca0" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7846" data-permalink="https://inero-software.com/top-lightweight-llms-for-local-deployment/attachment/111553/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/111553.png" data-orig-size="1154,649" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="111553" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/111553-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/111553-1030x579.png" tabindex="0" role="button" width="1030" height="579" src="https://inero-software.com/wp-content/uploads/2025/04/111553-1030x579.png" class="attachment-large size-large wp-image-7846" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/04/111553-1030x579.png 1030w, https://inero-software.com/wp-content/uploads/2025/04/111553-300x169.png 300w, https://inero-software.com/wp-content/uploads/2025/04/111553-768x432.png 768w, https://inero-software.com/wp-content/uploads/2025/04/111553-533x300.png 533w, https://inero-software.com/wp-content/uploads/2025/04/111553.png 1154w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7846" data-permalink="https://inero-software.com/top-lightweight-llms-for-local-deployment/attachment/111553/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/111553.png" data-orig-size="1154,649" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="111553" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/111553-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/111553-1030x579.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-c923f73 elementor-widget elementor-widget-text-editor" data-id="c923f73" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h6><span class="TextRun SCXW85460195 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW85460195 BCX0">Examples of insurance </span><span class="NormalTextRun SCXW85460195 BCX0">certifacates</span><span class="NormalTextRun SCXW85460195 BCX0">.</span></span><span class="EOP SCXW85460195 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></h6>						</div>
				</div>
				<div class="elementor-element elementor-element-e9e7e62 elementor-widget elementor-widget-text-editor" data-id="e9e7e62" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong><span class="TextRun SCXW36022441 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW36022441 BCX0">The table below presents the benchmark results.</span></span></strong> <span class="TextRun SCXW36022441 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW36022441 BCX0">Extraction accuracy</span></span><span class="TextRun SCXW36022441 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW36022441 BCX0"> refers to the number of documents (out of 11) where the model successfully extracted all key fields. </span></span><span class="TextRun SCXW36022441 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW36022441 BCX0">Token/sec</span></span><span class="TextRun SCXW36022441 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"> <span class="NormalTextRun SCXW36022441 BCX0">indicates</span><span class="NormalTextRun SCXW36022441 BCX0"> the model’s inference speed — how quickly it generates responses.</span></span><span class="EOP SCXW36022441 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-e5f35c8 elementor-widget elementor-widget-html" data-id="e5f35c8" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			<style>
  @import url('https://fonts.googleapis.com/css2?family=Roboto:wght@300&display=swap');

  .model-table {
    font-family: 'Roboto', sans-serif;
    font-weight: 300;
    font-size: 14px;
    color: #1C244B;
    border-collapse: collapse;
    width: 100%;
  }

  .model-table th, .model-table td {
    border: 1px solid #ccc;
    padding: 8px;
    text-align: left;
    color: #1C244B;
  }

  .model-table th {
    background-color: #f2f2f2;
  }

  .green-bg {
    background-color: #DFF0D8;
  }

  .red-bg {
    background-color: #F2DEDE;
  }
</style>

<table class="model-table">
  <thead>
    <tr>
      <th>Model</th>
      <th>Summarization</th>
      <th>Extraction Accuracy</th>
      <th>Tokens/sec</th>
    </tr>
  </thead>
  <tbody>
    <tr>
      <td>Llama 3.1 (8B)</td>
      <td class="green-bg">High-quality, no hallucinations</td>
      <td>10/11</td>
      <td>13.49</td>
    </tr>
    <tr>
      <td>StableLM 3B</td>
      <td class="red-bg">Average quality, typos/hallucinations</td>
      <td>4/11</td>
      <td>56.51</td>
    </tr>
    <tr>
      <td>Llama 3.2 (3B)</td>
      <td class="green-bg">Concise yet comprehensive summary, no hallucinations</td>
      <td>8/11</td>
      <td>49.49</td>
    </tr>
    <tr>
      <td>Mistral 7B</td>
      <td>Extensive summary, factually correct</td>
      <td>8/11</td>
      <td>29.01</td>
    </tr>
    <tr>
      <td>Gemma 3 4B</td>
      <td class="green-bg">Concise yet comprehensive summary, no hallucinations</td>
      <td>10/11</td>
      <td>13.37</td>
    </tr>
    <tr>
      <td>Gemma 3 1B</td>
      <td class="green-bg">Concise yet comprehensive summary, no hallucinations</td>
      <td>4/11</td>
      <td>73.46</td>
    </tr>
    <tr>
      <td>DeepSeek 7B</td>
      <td class="green-bg">Concise yet comprehensive summary, no hallucinations</td>
      <td>6/11</td>
      <td>16.39</td>
    </tr>
    <tr>
      <td>DeepSeek 1.5B</td>
      <td class="red-bg">Very poor, frequent hallucinations/errors</td>
      <td>0/11</td>
      <td>66.45</td>
    </tr>
    <tr>
      <td>Phi-4 Mini 3.8B</td>
      <td>Very concise summaries, factually correct</td>
      <td>9/11</td>
      <td>39.31</td>
    </tr>
    <tr>
      <td>TinyLlama 1.1B</td>
      <td class="red-bg">Poor quality, severe hallucinations</td>
      <td>2/11</td>
      <td>107.34</td>
    </tr>
  </tbody>
</table>
		</div>
				</div>
				<div class="elementor-element elementor-element-4f30579 elementor-widget elementor-widget-text-editor" data-id="4f30579" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h6><span class="TextRun SCXW220458249 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW220458249 BCX0">Table 2: </span><span class="NormalTextRun SCXW220458249 BCX0">B</span><span class="NormalTextRun SCXW220458249 BCX0">enchmarking results.</span></span><span class="TextRun SCXW220458249 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW220458249 BCX0"> </span></span><span class="EOP SCXW220458249 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></h6>						</div>
				</div>
				<div class="elementor-element elementor-element-1046393 elementor-widget elementor-widget-image" data-id="1046393" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7847" data-permalink="https://inero-software.com/top-lightweight-llms-for-local-deployment/lightweight-llm-scatterplot/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot.png" data-orig-size="1968,1180" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="lightweight-llm-scatterplot" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-300x180.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-1030x618.png" tabindex="0" role="button" width="1030" height="618" src="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-1030x618.png" class="attachment-large size-large wp-image-7847" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-1030x618.png 1030w, https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-300x180.png 300w, https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-768x460.png 768w, https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-1536x921.png 1536w, https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-500x300.png 500w, https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot.png 1968w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7847" data-permalink="https://inero-software.com/top-lightweight-llms-for-local-deployment/lightweight-llm-scatterplot/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot.png" data-orig-size="1968,1180" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="lightweight-llm-scatterplot" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-300x180.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/lightweight-llm-scatterplot-1030x618.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-704e9c5 elementor-widget elementor-widget-text-editor" data-id="704e9c5" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW241422309 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW241422309 BCX0">This scatterplot visualizes the </span></span><span class="TextRun SCXW241422309 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW241422309 BCX0">trade-off between extraction accuracy and inference speed</span></span><span class="TextRun SCXW241422309 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW241422309 BCX0"> (measured in tokens per second)</span></span><span class="EOP SCXW241422309 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-5527166 elementor-widget elementor-widget-text-editor" data-id="5527166" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="auto">The benchmarking results reveal significant variations among the tested models. </span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559685&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><strong>Bottom-right</strong><span data-contrast="auto"> models &#8211; </span><strong>Llama 3.1 (8B), Gemma 3 (4B)</strong><span data-contrast="auto">, and </span><strong>Phi-4 Mini (3.8B)</strong> <span data-contrast="auto">&#8211; </span><span data-contrast="auto">excel in summarization quality and extraction accuracy, consistently providing concise and accurate outputs. Phi-4 Mini seems to offer a good trade-off between speed and accuracy.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><strong>Mistral 7B, DeepSeek 7B, Llama 3.2</strong><span data-contrast="auto"> generate detailed and informative summaries, though their extraction performance is more moderate.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="-" data-font="Aptos" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Aptos&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;-&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><span data-contrast="auto">On the other hand, </span><strong>smaller models</strong> <span data-contrast="auto">(on the top-left side of the chart) like </span><strong><i>StableLM Zephyr (3B), Gemma 3 (1B)</i> and <i>TinyLlama</i></strong><i><span data-contrast="auto"> (1.1B)</span></i><span data-contrast="auto"> show significantly weaker extraction accuracy and are prone to frequent hallucinations. However, they benefit from faster inference times. Their limited context windows (e.g., 4k tokens) may contribute to these shortcomings. Overall, they may be suitable for only very basic tasks.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-1ac20ae elementor-widget elementor-widget-heading" data-id="1ac20ae" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Choosing the Right Model for Your Needs </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-11e1bfc elementor-widget elementor-widget-text-editor" data-id="11e1bfc" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW204701935 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW204701935 BCX0">When selecting a language model for document extraction or summarization, </span><span class="NormalTextRun SCXW204701935 BCX0">it’s</span><span class="NormalTextRun SCXW204701935 BCX0"> all about balancing </span></span><span class="TextRun SCXW204701935 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW204701935 BCX0">accuracy</span></span><span class="TextRun SCXW204701935 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW204701935 BCX0">, </span></span><span class="TextRun SCXW204701935 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW204701935 BCX0">speed</span></span><span class="TextRun SCXW204701935 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW204701935 BCX0">, and </span></span><span class="TextRun SCXW204701935 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW204701935 BCX0">hardware constraints</span></span><span class="TextRun SCXW204701935 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW204701935 BCX0">. Below is a quick breakdown to help you pick the best fit—whether you need high precision, fast inference, or something lightweight for basic tasks.</span></span><span class="EOP SCXW204701935 BCX0" data-ccp-props="{}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-689718c elementor-widget elementor-widget-text-editor" data-id="689718c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="4" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><strong>High Accuracy &amp; Reasonable Speed:</strong><span data-contrast="auto"> Choose </span><strong>Phi-4 Mini (3.8B), Gemma 3 (4B)</strong><span data-contrast="auto">, or </span><strong>Llama 3.1 (8B)</strong><span data-contrast="auto"> for robust extraction and summarization accuracy.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="4" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><strong>Fast Inference &amp; Moderate Accuracy:</strong><span data-contrast="auto"> Opt for </span><strong>Llama 3.2 (3B)</strong><span data-contrast="auto"> or </span><strong>StableLM Zephyr (3B)</strong><span data-contrast="auto"> for simpler tasks on limited hardware.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="4" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><strong>Balanced Performance (Accuracy-Speed Tradeoff): Mistral (7B)</strong><span data-contrast="auto"> provides strong general-purpose capability suitable for detailed document summarization tasks.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="4" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><strong>Low Resource Environments (Basic Tasks):</strong><span data-contrast="auto"> Consider </span><strong>TinyLlama (1.1B)</strong><span data-contrast="auto"> for quick extraction or classification on minimal hardware if accuracy isn&#8217;t critical.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-ee4c212 elementor-widget elementor-widget-heading" data-id="ee4c212" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Conclusion </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-510ec3a elementor-widget elementor-widget-text-editor" data-id="510ec3a" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW44846787 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW44846787 BCX0">Lightweight LLMs are increasingly </span><span class="NormalTextRun SCXW44846787 BCX0">viable</span><span class="NormalTextRun SCXW44846787 BCX0"> solutions for local deployment, particularly in document-intensive industries such as insurance. Models such as Phi-4 Mini, Gemma 3 (4B), and Mistral 7B provide </span><span class="NormalTextRun SCXW44846787 BCX0">strong performance</span><span class="NormalTextRun SCXW44846787 BCX0"> in summarization, extraction, and classification tasks. Carefully balancing model size, inference speed, and accuracy ensures </span><span class="NormalTextRun SCXW44846787 BCX0">optimal</span><span class="NormalTextRun SCXW44846787 BCX0"> outcomes, empowering organizations with affordable, private, and responsive AI solutions directly on owned hardware.</span></span><span class="EOP SCXW44846787 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-8874a86 elementor-cta--skin-cover elementor-animated-content elementor-bg-transform elementor-bg-transform-zoom-in elementor-widget elementor-widget-call-to-action" data-id="8874a86" data-element_type="widget" data-widget_type="call-to-action.default">
				<div class="elementor-widget-container">
					<a class="elementor-cta" href="https://inero-software.com/optimization-of-back-office-processes-with-ai-agent-implementation-a-practical-example/">
					<div class="elementor-cta__bg-wrapper">
				<div class="elementor-cta__bg elementor-bg" style="background-image: url(https://inero-software.com/wp-content/uploads/2025/03/cta-1903-1030x579.png);" role="img" aria-label="cta 1903"></div>
				<div class="elementor-cta__bg-overlay"></div>
			</div>
							<div class="elementor-cta__content">
				
									<h2 class="elementor-cta__title elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						This might interest you					</h2>
				
									<div class="elementor-cta__description elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						Optimization of Back-Office Processes with AI Agent Implementation: A Practical Example					</div>
				
									<div class="elementor-cta__button-wrapper elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
					<span class="elementor-cta__button elementor-button elementor-size-">
						Read the full text					</span>
					</div>
							</div>
						</a>
				</div>
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/top-lightweight-llms-for-local-deployment/">Top Lightweight LLMs for Local Deployment</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">7843</post-id>	</item>
		<item>
		<title>How to Prepare Your Company for AI Agent Implementation</title>
		<link>https://inero-software.com/how-to-prepare-your-company-for-ai-agent-implementation/</link>
		
		<dc:creator><![CDATA[Marta Kuprasz]]></dc:creator>
		<pubDate>Tue, 08 Apr 2025 08:45:46 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Blog]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[Ai agent]]></category>
		<category><![CDATA[AI development]]></category>
		<category><![CDATA[AI innovations]]></category>
		<category><![CDATA[Artificial Intelligence]]></category>
		<category><![CDATA[BusinessProcessesOptimization]]></category>
		<category><![CDATA[LLM]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=7741</guid>

					<description><![CDATA[<p>This article explains what to focus on before deploying an AI agent, which areas of the business need to be well-prepared, and how to avoid common mistakes.</p>
<p>Artykuł <a href="https://inero-software.com/how-to-prepare-your-company-for-ai-agent-implementation/">How to Prepare Your Company for AI Agent Implementation</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="7741" class="elementor elementor-7741" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-baa7356 e-flex e-con-boxed e-con e-parent" data-id="baa7356" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-e8f2a57 elementor-widget elementor-widget-html" data-id="e8f2a57" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			 		</div>
				</div>
				<div class="elementor-element elementor-element-a583053 elementor-widget elementor-widget-text-editor" data-id="a583053" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h4>Implementing an AI agent in a company is not only a technological challenge but also a strategic one. As more businesses consider using artificial intelligence in their daily operations—from customer service to document analysis—successful implementation requires careful planning. This article explains what to focus on before deploying an AI agent, which areas of the business need to be well-prepared, and how to avoid common mistakes.</h4>						</div>
				</div>
				<div class="elementor-element elementor-element-068de27 elementor-widget elementor-widget-text-editor" data-id="068de27" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>There are many areas where AI can be helpful. From automating routine tasks, supporting customer service and data analysis, to streamlining decision-making processes and creating intelligent assistants that support team workflows. The potential is enormous—but the key lies in properly preparing the organization for this change.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-37b67aa elementor-widget elementor-widget-heading" data-id="37b67aa" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Stages of AI Assistant Implementation</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-42d1b2e elementor-widget elementor-widget-text-editor" data-id="42d1b2e" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>The process of implementing an AI assistant in an organization can be divided into several stages, each requiring specific actions. From analyzing business needs, selecting the right language model, and preparing the infrastructure, to integrating with existing systems and testing—each step impacts the overall effectiveness of the solution.</p><p>The key stages are:</p>						</div>
				</div>
				<div class="elementor-element elementor-element-10d35ec elementor-widget elementor-widget-text-editor" data-id="10d35ec" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ol><li data-leveltext="%1." data-font="" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:0,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769242&quot;:[65533,0],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;%1.&quot;,&quot;469777815&quot;:&quot;multilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1">Needs analysis and readiness assessment</li><li data-leveltext="%1." data-font="" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:0,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769242&quot;:[65533,0],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;%1.&quot;,&quot;469777815&quot;:&quot;multilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1">Data and content preparation</li><li data-leveltext="%1." data-font="" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:0,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769242&quot;:[65533,0],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;%1.&quot;,&quot;469777815&quot;:&quot;multilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1">Solution design</li><li data-leveltext="%1." data-font="" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:0,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769242&quot;:[65533,0],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;%1.&quot;,&quot;469777815&quot;:&quot;multilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1">Assistant development and configuration</li><li data-leveltext="%1." data-font="" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:0,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769242&quot;:[65533,0],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;%1.&quot;,&quot;469777815&quot;:&quot;multilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1">Testing and pilot phase</li><li data-leveltext="%1." data-font="" data-listid="1" data-list-defn-props="{&quot;335552541&quot;:0,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769242&quot;:[65533,0],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;%1.&quot;,&quot;469777815&quot;:&quot;multilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1">Deployment and maintenance</li></ol>						</div>
				</div>
				<div class="elementor-element elementor-element-bc457df elementor-widget elementor-widget-heading" data-id="bc457df" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Needs analysis and readiness assessment</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-52ccfa0 elementor-widget elementor-widget-text-editor" data-id="52ccfa0" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>To ensure the best results from implementing an AI agent, start by asking yourself: which tasks and areas have the most potential for optimization through the use of artificial intelligence?</p>						</div>
				</div>
				<div class="elementor-element elementor-element-2092bd9 elementor-widget elementor-widget-text-editor" data-id="2092bd9" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>When looking for an answer to this question, it’s worth carefully analyzing your company’s current structure, processes, and employee responsibilities. This will help identify so-called “bottlenecks” that may affect the quality of services provided. These might include, for example:</p><ul><li style="list-style-type: none;"><ul><li><p>long response times to quote requests</p></li><li><p>teams overloaded with routine tasks</p></li><li><p>lack of consistency in customer communication</p></li><li><p>manual processing of documents and data</p></li><li><p>difficulties in quickly accessing internal company knowledge</p></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-bb5fac4 elementor-widget elementor-widget-text-editor" data-id="bb5fac4" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Based on this analysis, you’ll be able to identify areas for improvement as well as the people who will directly benefit from the support of AI assistants.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-9a37800 elementor-widget elementor-widget-text-editor" data-id="9a37800" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>The second area that should be reviewed is the existing infrastructure. Implementing an AI assistant doesn’t require a large amount of hardware. If the company doesn’t want to invest in new machines, it can opt to use cloud services such as Azure, AWS, or Google Cloud.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-aacf051 elementor-widget elementor-widget-text-editor" data-id="aacf051" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Data is a crucial part of the preparation process. To fully leverage the potential of dedicated AI solutions, it’s important to understand that training the model behind the assistant requires datasets stored in digital form. These should be well-organized and kept in a central repository or database. The less structured the data, the higher the cost of implementing the assistant—and the greater the risk that the solution won’t meet expectations.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-60b308a elementor-widget elementor-widget-heading" data-id="60b308a" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Data and content preparation</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-255b41d elementor-widget elementor-widget-text-editor" data-id="255b41d" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>At this stage, it’s essential to gather all materials that contain important company knowledge—this may include PDF, Word, and Excel documents, website content, FAQ sections, emails, or data from databases.</p><p> </p><p>Next, the collected information needs to be properly prepared—organized, cleaned of unnecessary content (e.g., unreadable PDFs), standardized where possible, and exported to CSV or JSON files (e.g., emails).</p><p> </p><p>In some cases, such as when planning further model customization (fine-tuning), it will also be necessary to label the data or prepare a dedicated training set in the form of instructions and expected responses, for example:</p>						</div>
				</div>
				<div class="elementor-element elementor-element-b8339ff elementor-widget elementor-widget-text-editor" data-id="b8339ff" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre>{"prompt": "What documents are required to sign an OCS agreement?", "response": "The following documents are required to sign an OCS agreement: ..."}</pre>						</div>
				</div>
				<div class="elementor-element elementor-element-301fbbb elementor-widget elementor-widget-heading" data-id="301fbbb" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Solution design</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-516c119 elementor-widget elementor-widget-text-editor" data-id="516c119" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>At this stage, decisions are made about the technical design of the solution. It’s important to define what type of assistant will best meet the company’s needs—whether it’s a simple chatbot answering questions, a more advanced assistant with access to company knowledge (so-called RAG – Retrieval-Augmented Generation), or an agent capable of independently performing specific tasks such as making bookings, generating reports, or sending emails.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-1b4b071 elementor-widget elementor-widget-text-editor" data-id="1b4b071" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>The next step is selecting the appropriate technologies, including the large language model (LLM) that will power the assistant—such as GPT-4, Claude, Mistral, LLaMA, or Gemini—depending on specific needs and requirements related to privacy, cost, and integration capabilities.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-d9610e4 elementor-widget elementor-widget-text-editor" data-id="d9610e4" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>Finally, it’s worth preparing a list of functions the assistant should perform and planning integration with other systems used in the company—such as the CRM, knowledge base, or email.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-a34770c elementor-widget elementor-widget-heading" data-id="a34770c" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Assistant development and configuration</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-ff744d0 elementor-widget elementor-widget-text-editor" data-id="ff744d0" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>At this stage, both the technical backend and the user-facing part of the assistant (frontend) are developed. This could be, for example, a chat interface on the website, a button that launches the assistant in an application, or a widget integrated with tools like Slack. You can read more about how AI agent integration with the <a href="https://inero-software.com/optimization-of-back-office-processes-with-ai-agent-implementation-a-practical-example/">Slack communication platform can look here &gt;&gt;LINK</a></p>						</div>
				</div>
				<div class="elementor-element elementor-element-3b817d5 elementor-widget elementor-widget-text-editor" data-id="3b817d5" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>In parallel, the selected language model is deployed—via services such as Azure OpenAI, OpenAI API, Anthropic (Claude), Google Vertex AI (Gemini), or locally using open-source models like LLaMA, Mistral, or Mixtral.</p><p> </p><p>If the assistant is meant to use internal company knowledge, a RAG (Retrieval-Augmented Generation) mechanism needs to be configured—enabling it to search and match relevant documents to user queries.</p><p> </p><p>Finally, integrations with other systems—such as CRM, ticketing systems, or email—are implemented, allowing the assistant to meaningfully support the team’s day-to-day work.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-fa67de7 elementor-widget elementor-widget-heading" data-id="fa67de7" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Testing and pilot phase</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-56858f2 elementor-widget elementor-widget-text-editor" data-id="56858f2" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>After implementation, thorough testing of the solution is essential. The first step is functional testing—checking whether the assistant correctly understands user intent, responds in line with company documentation, and handles different types of queries appropriately.</p><p> </p><p>The next phase is testing with end users (UAT – User Acceptance Testing), which helps assess how well the assistant performs in real-world scenarios and whether it meets employees’ expectations.</p><p> </p><p>Based on feedback and observations, iterative improvements are made—such as adjusting responses, adding new documents to the knowledge base, or refining prompts and the agent’s logic. This phase is often repeated several times until a satisfactory level of quality is achieved.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-dd6864e elementor-widget elementor-widget-heading" data-id="dd6864e" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Deployment and maintenance</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-c10b8e9 elementor-widget elementor-widget-text-editor" data-id="c10b8e9" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>After completing the testing phase, the assistant is deployed to the target infrastructure—this may be a public cloud (e.g., Azure, AWS, GCP), on-premise servers, or a hybrid solution, depending on security and availability requirements. More about this is covered later in the article.</p><p> </p><p>It’s also necessary to set up monitoring, which allows you to track things like token usage, query frequency, error rates, and the quality of generated responses. This enables quick issue resolution and cost optimization.</p><p>In daily use, it’s important to keep the data up to date—adding new documents, removing outdated information, and updating the knowledge base the assistant relies on.</p><p> </p><p>Over time, as business needs evolve, it may be worth considering retraining or fine-tuning the model—e.g., every few months—to better align it with the organization’s specific context.</p><p> </p><p>Finally, it’s important to provide technical support and user assistance to ensure the solution is not only technically reliable but also convenient and intuitive for everyday use.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-817acb3 elementor-widget elementor-widget-heading" data-id="817acb3" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Data privacy</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-20711ec elementor-widget elementor-widget-text-editor" data-id="20711ec" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>In the “Deployment and maintenance” section, we discussed the available options for choosing the infrastructure on which the AI agent will be deployed.</p><p>Each solution has its pros and cons. Choosing an on-premise setup gives you full control over the data, but it requires a dedicated machine with specific parameters.</p><p>Another option is using a public cloud service, such as Azure. Microsoft clearly states that data submitted to the Azure OpenAI service is not used to train or improve OpenAI or Microsoft models (<a href="https://learn.microsoft.com/en-us/legal/cognitive-services/openai/data-privacy?tabs=azure-portal">source</a>).</p><p>According to Microsoft, prompts and responses are not shared with other customers or OpenAI. Azure operates in full isolation mode: when using GPT-4 on Azure, no information from your conversations is shared with OpenAI LLC. Microsoft has confirmed this in a Data Processing Addendum (DPA).</p>						</div>
				</div>
				<div class="elementor-element elementor-element-16536f6 elementor-widget elementor-widget-heading" data-id="16536f6" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">AI decision accountability</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-68f238b elementor-widget elementor-widget-text-editor" data-id="68f238b" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>It’s important to remember that formal and legal responsibility for the outcomes of an AI agent’s actions and the data it processes lies with the entity that implemented and oversees the solution—most often.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-104a126 elementor-widget elementor-widget-text-editor" data-id="104a126" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ol><li>the organization (e.g., the company that deployed the assistant),</li><li>the system administrator,</li><li>the individual making decisions based on AI suggestions (e.g., a customer service representative, recruiter, or doctor).</li></ol>						</div>
				</div>
				<div class="elementor-element elementor-element-85f731f elementor-widget elementor-widget-text-editor" data-id="85f731f" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong>How to reduce risk?</strong></p>						</div>
				</div>
				<div class="elementor-element elementor-element-6db7698 elementor-widget elementor-widget-text-editor" data-id="6db7698" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ol><li>Human-in-the-loop (HITL) – A human must approve important decisions, while AI only supports the process (e.g., the assistant drafts a response, but a person approves it).</li><li>Clear disclaimers and warnings – The AI should inform users: “I am an AI assistant – please verify my responses before making a decision.”</li><li>Source verification – The AI assistant should, where possible, cite sources for its answers or indicate when it doesn’t know rather than guessing. Using RAG enables precise control over the knowledge base.</li></ol>						</div>
				</div>
				<div class="elementor-element elementor-element-ab8fe88 elementor-widget elementor-widget-heading" data-id="ab8fe88" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Summary</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-32ea263 elementor-widget elementor-widget-text-editor" data-id="32ea263" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong>The process of implementing an AI agent must be well-planned and carefully considered. It may seem challenging at first, but with proper preparation, it can deliver long-term benefits. If you need support, feel free to contact us.</strong></p><p><span data-ccp-props="{}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-05552e5 elementor-cta--skin-cover elementor-animated-content elementor-bg-transform elementor-bg-transform-zoom-in elementor-widget elementor-widget-call-to-action" data-id="05552e5" data-element_type="widget" data-widget_type="call-to-action.default">
				<div class="elementor-widget-container">
					<a class="elementor-cta" href="https://inero-software.com/contact-inero-software-rd-software-house/">
					<div class="elementor-cta__bg-wrapper">
				<div class="elementor-cta__bg elementor-bg" style="background-image: url(https://inero-software.com/wp-content/uploads/2025/02/cta-AI2-1030x579.png);" role="img" aria-label="cta AI2"></div>
				<div class="elementor-cta__bg-overlay"></div>
			</div>
							<div class="elementor-cta__content">
				
									<h2 class="elementor-cta__title elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						AI Agent in Your Company?					</h2>
				
									<div class="elementor-cta__description elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						Write to us and find out how an AI Agent can support your company.					</div>
				
									<div class="elementor-cta__button-wrapper elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
					<span class="elementor-cta__button elementor-button elementor-size-">
						Contact					</span>
					</div>
							</div>
						</a>
				</div>
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/how-to-prepare-your-company-for-ai-agent-implementation/">How to Prepare Your Company for AI Agent Implementation</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">7741</post-id>	</item>
		<item>
		<title>Deploying LLMs Locally: A Guide to Ollama and LM Studio</title>
		<link>https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/</link>
		
		<dc:creator><![CDATA[Martyna Mul]]></dc:creator>
		<pubDate>Fri, 04 Apr 2025 08:53:42 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Blog]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[AI development]]></category>
		<category><![CDATA[AI innovations]]></category>
		<category><![CDATA[api]]></category>
		<category><![CDATA[Artificial Intelligence]]></category>
		<category><![CDATA[CLI Tool]]></category>
		<category><![CDATA[Large Language Model]]></category>
		<category><![CDATA[LLM]]></category>
		<category><![CDATA[LM Studio]]></category>
		<category><![CDATA[Local deployment]]></category>
		<category><![CDATA[Ollama]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=7692</guid>

					<description><![CDATA[<p>Whether you’re building a custom chatbot, agent, an AI-powered code assistant, or using AI to analyse documents offline, local deployment empowers you to experiment and innovate without relying on external services. </p>
<p>Artykuł <a href="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/">Deploying LLMs Locally: A Guide to Ollama and LM Studio</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="7692" class="elementor elementor-7692" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-139e1f8 e-flex e-con-boxed e-con e-parent" data-id="139e1f8" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-2474df1 elementor-widget elementor-widget-html" data-id="2474df1" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			 		</div>
				</div>
				<div class="elementor-element elementor-element-29e8b23 elementor-widget elementor-widget-text-editor" data-id="29e8b23" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h4><span class="TextRun SCXW12802383 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW12802383 BCX0">Local deployment of Large Language Models (LLMs) is becoming increasingly popular among developers, tech enthusiasts, and professionals in industries like insurance and transport. Unlike cloud-based APIs, local LLM deployment offers greater privacy, offline accessibility, and complete control over resource optimization and inference performance.</span></span><span class="EOP SCXW12802383 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></h4>						</div>
				</div>
				<div class="elementor-element elementor-element-d13f5fb elementor-widget elementor-widget-text-editor" data-id="d13f5fb" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW230118114 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW230118114 BCX0">Running models like Llama 2 or Mistral directly on your hardware means your data stays on your machine — ideal for privacy-sensitive tasks such as processing insurance documents or working with proprietary transport data. There are no recurring API costs, and the performance depends solely on your system. Whether </span><span class="NormalTextRun SCXW230118114 BCX0">you&#8217;re</span><span class="NormalTextRun SCXW230118114 BCX0"> building a custom chatbot, </span><span class="NormalTextRun SCXW230118114 BCX0">agent, </span><span class="NormalTextRun SCXW230118114 BCX0">an AI-powered code assistant, or using AI to </span><span class="NormalTextRun SCXW230118114 BCX0">analyse</span><span class="NormalTextRun SCXW230118114 BCX0"> documents offline, local deployment empowers you to experiment and innovate without relying on external services.</span></span><span class="EOP SCXW230118114 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-313a919 elementor-widget elementor-widget-text-editor" data-id="313a919" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW97631897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW97631897 BCX0">In this guide, </span><span class="NormalTextRun SCXW97631897 BCX0">we&#8217;ll</span><span class="NormalTextRun SCXW97631897 BCX0"> explore two powerful tools that make this possible: </span></span><span class="TextRun SCXW97631897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW97631897 BCX0"><b>Ollama</b></span></span><span class="TextRun SCXW97631897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW97631897 BCX0"> and </span></span><span class="TextRun SCXW97631897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW97631897 BCX0"><b>LM Studio</b></span></span><span class="TextRun SCXW97631897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW97631897 BCX0">. </span><span class="NormalTextRun SCXW97631897 BCX0">We&#8217;ll</span><span class="NormalTextRun SCXW97631897 BCX0"> walk through installation, usage, and customization, helping you pick the best </span><span class="NormalTextRun SCXW97631897 BCX0">option</span><span class="NormalTextRun SCXW97631897 BCX0"> for your goals.</span></span><span class="EOP SCXW97631897 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}">&nbsp;</span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-66f4910 elementor-widget elementor-widget-heading" data-id="66f4910" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Getting Started with Ollama (CLI Tool) </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-55390e0 elementor-widget elementor-widget-text-editor" data-id="55390e0" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW101755402 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW101755402 BCX0">Ollama</span><span class="NormalTextRun SCXW101755402 BCX0"> is a lightweight, open-source command-line tool for running LLMs locally. It acts as a model manager and runtime, making it easy to download and execute open-source models (like Llama 2, Mistral, </span><span class="NormalTextRun SpellingErrorV2Themed SCXW101755402 BCX0">CodeLlama</span><span class="NormalTextRun SCXW101755402 BCX0">, etc.) on your </span><span class="NormalTextRun SCXW101755402 BCX0">machine.</span> <span class="NormalTextRun SpellingErrorV2Themed SCXW101755402 BCX0">Ollama</span><span class="NormalTextRun SCXW101755402 BCX0"> is available for macOS, Linux, and Windows</span><span class="NormalTextRun SCXW101755402 BCX0">, and it includes a local REST API for integration into applications.</span></span><span class="EOP SCXW101755402 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-f83e139 elementor-widget elementor-widget-text-editor" data-id="f83e139" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW107598507 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW107598507 BCX0">1.<b> Install </b></span><b><span class="NormalTextRun SpellingErrorV2Themed SCXW107598507 BCX0">Ollama</span><span class="NormalTextRun SCXW107598507 BCX0"> on Your System:</span></b></span><span class="TextRun SCXW107598507 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW107598507 BCX0"><b> </b>Download the installer for your platform from the official </span><span class="NormalTextRun SpellingErrorV2Themed SCXW107598507 BCX0">Ollama</span><span class="NormalTextRun SCXW107598507 BCX0"> website or use a package manager.</span></span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-f34ab2b elementor-widget elementor-widget-text-editor" data-id="f34ab2b" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW8978879 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW8978879 BCX0">On Windows, download the </span></span><span class="TextRun SCXW8978879 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW8978879 BCX0"><b>OllamaSetup.exe</b></span></span><span class="TextRun SCXW8978879 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW8978879 BCX0"> from the website and run </span><span class="NormalTextRun SCXW8978879 BCX0">it.</span><span class="NormalTextRun SCXW8978879 BCX0"> On Linux, you can install </span><span class="NormalTextRun SpellingErrorV2Themed SCXW8978879 BCX0">Ollama</span><span class="NormalTextRun SCXW8978879 BCX0"> with one command:</span></span><span class="EOP SCXW8978879 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}">&nbsp;</span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-b668357 elementor-widget elementor-widget-text-editor" data-id="b668357" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW8325834 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW8325834 BCX0">curl -</span><span class="NormalTextRun SpellingErrorV2Themed SCXW8325834 BCX0">fsSL</span> </span><a class="Hyperlink SCXW8325834 BCX0" href="https://ollama.com/install.sh" target="_blank" rel="noreferrer noopener"><span class="TextRun Underlined SCXW8325834 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW8325834 BCX0" data-ccp-charstyle="Hyperlink">https://ollama.com/install.sh</span></span></a><span class="TextRun SCXW8325834 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW8325834 BCX0"> | </span><span class="NormalTextRun SpellingErrorV2Themed SCXW8325834 BCX0">sh</span></span><span class="EOP SCXW8325834 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-c086d50 elementor-widget elementor-widget-text-editor" data-id="c086d50" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW172550952 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW172550952 BCX0">After installation, open a terminal/command prompt and verify </span><span class="NormalTextRun SCXW172550952 BCX0">it’s</span><span class="NormalTextRun SCXW172550952 BCX0"> installed by checking the version:</span></span><span class="EOP SCXW172550952 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-a98aedb elementor-widget elementor-widget-text-editor" data-id="a98aedb" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW230245657 BCX0" lang="EN-GB" style="-webkit-user-drag: none; -webkit-tap-highlight-color: transparent; margin: 0px; padding: 0px; user-select: text; white-space-collapse: preserve; font-size: 11pt; line-height: 19.7625px; font-family: Consolas, Consolas_EmbeddedFont, Consolas_MSFontService, monospace; font-variant-ligatures: none !important;" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW230245657 BCX0" style="-webkit-user-drag: none; -webkit-tap-highlight-color: transparent; margin: 0px; padding: 0px; user-select: text; background-position: 0px 100%; background-repeat: repeat-x; border-bottom: 1px solid transparent;">ollama</span><span class="NormalTextRun SCXW230245657 BCX0" style="-webkit-user-drag: none; -webkit-tap-highlight-color: transparent; margin: 0px; padding: 0px; user-select: text;"> -</span><span class="NormalTextRun SCXW230245657 BCX0" style="-webkit-user-drag: none; -webkit-tap-highlight-color: transparent; margin: 0px; padding: 0px; user-select: text;">-</span><span class="NormalTextRun SCXW230245657 BCX0" style="-webkit-user-drag: none; -webkit-tap-highlight-color: transparent; margin: 0px; padding: 0px; user-select: text;">version</span></span><span class="EOP SCXW230245657 BCX0" style="-webkit-user-drag: none; -webkit-tap-highlight-color: transparent; margin: 0px; padding: 0px; user-select: text; white-space-collapse: preserve; font-size: 11pt; line-height: 19.7625px; font-family: Consolas, Consolas_EmbeddedFont, Consolas_MSFontService, monospace;" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-fe7e512 elementor-widget elementor-widget-text-editor" data-id="fe7e512" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW228829587 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW228829587 BCX0">This should display the installed </span><span class="NormalTextRun SpellingErrorV2Themed SCXW228829587 BCX0">Ollama</span><span class="NormalTextRun SCXW228829587 BCX0"> version, confirming </span><span class="NormalTextRun SCXW228829587 BCX0">it’s</span><span class="NormalTextRun SCXW228829587 BCX0"> ready to </span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW228829587 BCX0">use,</span><span class="NormalTextRun SCXW228829587 BCX0"> e.g.:</span></span><span class="EOP SCXW228829587 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}">&nbsp;</span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-8f0123b elementor-widget elementor-widget-text-editor" data-id="8f0123b" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW19868586 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW19868586 BCX0">ollama</span><span class="NormalTextRun SCXW19868586 BCX0"> version is 0.6.2</span></span><span class="EOP SCXW19868586 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-cf0e477 elementor-widget elementor-widget-text-editor" data-id="cf0e477" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW20221182 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW20221182 BCX0">2<b>. Download an LLM Model (&#8220;Pull&#8221; a Model)</b>:</span></span><span class="TextRun SCXW20221182 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"> <span class="NormalTextRun SpellingErrorV2Themed SCXW20221182 BCX0">Ollama</span><span class="NormalTextRun SCXW20221182 BCX0"> has a built-in model library. You can search their </span><span class="NormalTextRun SpellingErrorV2Themed SCXW20221182 BCX0">catalog</span><span class="NormalTextRun SCXW20221182 BCX0"> on the website or simply pull a known model by name. For example, to download the 7B parameter Llama 2 chat model, run:</span></span><span class="EOP SCXW20221182 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}">&nbsp;</span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-abab4bd elementor-widget elementor-widget-text-editor" data-id="abab4bd" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW86029186 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW86029186 BCX0">ollama</span><span class="NormalTextRun SCXW86029186 BCX0"> pull llama2:7b-chat</span></span><span class="EOP SCXW86029186 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-e31da10 elementor-widget elementor-widget-text-editor" data-id="e31da10" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW158953993 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW158953993 BCX0">This command fetches the model weights to your machine (it may take a while, as models are multiple GBs in </span><span class="NormalTextRun SCXW158953993 BCX0">size)</span><span class="NormalTextRun SCXW158953993 BCX0">. You only need to pull a model once; </span><span class="NormalTextRun SCXW158953993 BCX0">afterward</span> <span class="NormalTextRun SCXW158953993 BCX0">it’s</span><span class="NormalTextRun SCXW158953993 BCX0"> stored locally. You can list all downloaded models with </span><span class="NormalTextRun SpellingErrorV2Themed SCXW158953993 BCX0">ollama</span><span class="NormalTextRun SCXW158953993 BCX0"> list if needed.</span></span><span class="EOP SCXW158953993 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-0fe8c48 elementor-widget elementor-widget-text-editor" data-id="0fe8c48" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong><span class="TextRun SCXW87322540 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW87322540 BCX0">3. Run the Model Locally:</span></span></strong><span class="TextRun SCXW87322540 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW87322540 BCX0"> Once downloaded, you can execute the model with the </span><span class="NormalTextRun SpellingErrorV2Themed SCXW87322540 BCX0">ollama</span><span class="NormalTextRun SCXW87322540 BCX0"> run command. This will launch an interactive session where you can enter prompts and get responses. For example:</span></span><span class="EOP SCXW87322540 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-bb58a0a elementor-widget elementor-widget-text-editor" data-id="bb58a0a" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW171041342 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW171041342 BCX0">ollama</span><span class="NormalTextRun SCXW171041342 BCX0"> run llama2:7b-chat &gt;&gt;&gt; What is the capital city of Poland?</span></span><span class="EOP SCXW171041342 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-c17cc6e elementor-widget elementor-widget-text-editor" data-id="c17cc6e" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW99918251 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW99918251 BCX0">After running the above, </span><span class="NormalTextRun SpellingErrorV2Themed SCXW99918251 BCX0">Ollama</span><span class="NormalTextRun SCXW99918251 BCX0"> will load the </span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW99918251 BCX0">model</span><span class="NormalTextRun SCXW99918251 BCX0"> and </span><span class="NormalTextRun SCXW99918251 BCX0">you’ll</span><span class="NormalTextRun SCXW99918251 BCX0"> see an </span></span><span class="TextRun SCXW99918251 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW99918251 BCX0">&gt;&gt;&gt;</span></span><span class="TextRun SCXW99918251 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW99918251 BCX0"> prompt. You can then type your questions or instructions. The model (here Llama 2 7B chat) will generate a response to each prompt. For instance, you might ask “What is the capital of France?” and get an answer like “Paris is the capital of France.” printed in the terminal. Internally, the first run may take a bit to initialize, but </span><span class="NormalTextRun SCXW99918251 BCX0">subsequent</span><span class="NormalTextRun SCXW99918251 BCX0"> prompts are answered interactively. </span></span><span class="TextRun SCXW99918251 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW99918251 BCX0">Tip:</span></span><span class="TextRun SCXW99918251 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW99918251 BCX0"> You can also pass a one-off prompt directly in the command, e.g. </span><span class="NormalTextRun SpellingErrorV2Themed SCXW99918251 BCX0">ollama</span><span class="NormalTextRun SCXW99918251 BCX0"> run llama2:7b </span></span><span class="TextRun SCXW99918251 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW99918251 BCX0">&#8220;<b>What is the capital city of Poland?</b>&#8220;</span></span><span class="TextRun SCXW99918251 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW99918251 BCX0"> will output a single response and return to the </span><span class="NormalTextRun SCXW99918251 BCX0">shell.</span></span><span class="EOP SCXW99918251 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-846e51f elementor-widget elementor-widget-text-editor" data-id="846e51f" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW252478220 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW252478220 BCX0">You can also start </span><span class="NormalTextRun SpellingErrorV2Themed SCXW252478220 BCX0">Ollama</span><span class="NormalTextRun SCXW252478220 BCX0"> as a background server with </span><span class="NormalTextRun SpellingErrorV2Themed SCXW252478220 BCX0">ollama</span><span class="NormalTextRun SCXW252478220 BCX0"> serve. This enables the REST API on localhost:11434, which developers can use to integrate the model into apps via HTTP </span><span class="NormalTextRun SCXW252478220 BCX0">calls.</span><span class="NormalTextRun SCXW252478220 BCX0"> You can ask the model by sending POST request, e.g.:</span></span><span class="EOP SCXW252478220 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-7fa1a27 elementor-widget elementor-widget-text-editor" data-id="7fa1a27" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW24036424 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW24036424 BCX0">curl </span></span><a class="Hyperlink SCXW24036424 BCX0" href="http://localhost:11434/api/generate" target="_blank" rel="noreferrer noopener"><span class="TextRun Underlined SCXW24036424 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW24036424 BCX0" data-ccp-charstyle="Hyperlink">http://localhost:11434/api/generate</span></span></a><span class="TextRun SCXW24036424 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW24036424 BCX0"> -d </span></span><span class="TextRun SCXW24036424 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW24036424 BCX0">'{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW24036424 BCX0"><span class="SCXW24036424 BCX0"> </span><br class="SCXW24036424 BCX0" /></span><span class="TextRun SCXW24036424 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW24036424 BCX0">  "model": "llama2:7b-chat",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW24036424 BCX0"><span class="SCXW24036424 BCX0"> </span><br class="SCXW24036424 BCX0" /></span><span class="TextRun SCXW24036424 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW24036424 BCX0">  "prompt": "What is the capital city of Poland?"</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW24036424 BCX0"><span class="SCXW24036424 BCX0"> </span><br class="SCXW24036424 BCX0" /></span><span class="TextRun SCXW24036424 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW24036424 BCX0">}'</span></span><span class="EOP SCXW24036424 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-77dd7b1 elementor-widget elementor-widget-text-editor" data-id="77dd7b1" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW28772340 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW28772340 BCX0">The API returns newline-separated JSON objects, chunk by chunk, as the model generates the response:</span></span><span class="EOP SCXW28772340 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-943d033 elementor-widget elementor-widget-text-editor" data-id="943d033" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"model"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"llama2:7b-chat"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">created_at</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"2025-04-02T15:19:17.1569954Z"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"response"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"The"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"done"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">false</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"model"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"llama2:7b-chat"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">created_at</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"2025-04-02T15:19:17.268992Z"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"response"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">" capital"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"done"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">false</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"model"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"llama2:7b-chat"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">created_at</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"2025-04-02T15:19:17.3796491Z"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"response"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">" city"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"done"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">false</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">...</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"model"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"llama2:7b-chat"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">created_at</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"2025-04-02T15:19:21.3106413Z"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"response"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">" Warszawa"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"done"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">false</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"model"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"llama2:7b-chat"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">created_at</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"2025-04-02T15:19:21.4619772Z"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"response"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">")."</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"done"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">false</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"model"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"llama2:7b-chat"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">created_at</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"2025-04-02T15:19:21.6296267Z"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"response"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">""</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"done"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">true</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">done_reason</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"stop"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">total_duration</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: 5337417000,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">load_duration</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: 8625100,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">prompt_eval_count</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: 28,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">prompt_eval_duration</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: 854952300,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">eval_count</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: 15,</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">    </span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">"</span><span class="NormalTextRun SpellingErrorV2Themed SCXW52386783 BCX0">eval_duration</span><span class="NormalTextRun SCXW52386783 BCX0">"</span></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">: 4472807400</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW52386783 BCX0"><span class="SCXW52386783 BCX0"> </span><br class="SCXW52386783 BCX0" /></span><span class="TextRun SCXW52386783 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52386783 BCX0">}</span></span><span class="EOP SCXW52386783 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-10d3ffe elementor-widget elementor-widget-text-editor" data-id="10d3ffe" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW26657317 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW26657317 BCX0">If you set stream: </span></span><span class="TextRun SCXW26657317 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW26657317 BCX0">false</span></span><span class="TextRun SCXW26657317 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW26657317 BCX0">, the response is a single JSON object:</span></span><span class="EOP SCXW26657317 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-af79c25 elementor-widget elementor-widget-text-editor" data-id="af79c25" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0">curl </span></span><a class="Hyperlink SCXW81302069 BCX0" href="http://localhost:11434/api/generate" target="_blank" rel="noreferrer noopener"><span class="TextRun Underlined SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0" data-ccp-charstyle="Hyperlink">http://localhost:11434/api/generate</span></span></a><span class="TextRun SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0"> -d </span></span><span class="TextRun SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0">'{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW81302069 BCX0"><span class="SCXW81302069 BCX0"> </span><br class="SCXW81302069 BCX0" /></span><span class="TextRun SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0">  "model": "llama2:7b-chat",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW81302069 BCX0"><span class="SCXW81302069 BCX0"> </span><br class="SCXW81302069 BCX0" /></span><span class="TextRun SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0">  "prompt": "What is the capital city of Poland?",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW81302069 BCX0"><span class="SCXW81302069 BCX0"> </span><br class="SCXW81302069 BCX0" /></span><span class="TextRun SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0">  "stream": false</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW81302069 BCX0"><span class="SCXW81302069 BCX0"> </span><br class="SCXW81302069 BCX0" /></span><span class="TextRun SCXW81302069 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW81302069 BCX0">}</span></span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-3d76430 elementor-widget elementor-widget-text-editor" data-id="3d76430" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW62602235 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW62602235 BCX0">You can also set </span><span class="NormalTextRun SCXW62602235 BCX0">a number of</span><span class="NormalTextRun SCXW62602235 BCX0"> model parameters such as </span></span><span class="TextRun SCXW62602235 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW62602235 BCX0">temperature</span></span><span class="TextRun SCXW62602235 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW62602235 BCX0"> by adding field </span></span><span class="TextRun SCXW62602235 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW62602235 BCX0">options</span></span><span class="TextRun SCXW62602235 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW62602235 BCX0">:</span></span><span class="EOP SCXW62602235 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-12fc8b0 elementor-widget elementor-widget-text-editor" data-id="12fc8b0" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">curl </span></span><a class="Hyperlink SCXW121643900 BCX0" href="http://localhost:11434/api/generate" target="_blank" rel="noreferrer noopener"><span class="TextRun Underlined SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0" data-ccp-charstyle="Hyperlink">http://localhost:11434/api/generate</span></span></a><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0"> -d </span></span><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">'{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW121643900 BCX0"><span class="SCXW121643900 BCX0"> </span><br class="SCXW121643900 BCX0" /></span><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">  "model": "llama2:7b-chat",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW121643900 BCX0"><span class="SCXW121643900 BCX0"> </span><br class="SCXW121643900 BCX0" /></span><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">  "prompt": "What is the capital city of Poland?",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW121643900 BCX0"><span class="SCXW121643900 BCX0"> </span><br class="SCXW121643900 BCX0" /></span><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">  "options": {</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW121643900 BCX0"><span class="SCXW121643900 BCX0"> </span><br class="SCXW121643900 BCX0" /></span> <span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">"temperature": 0.2  </span></span><span class="LineBreakBlob BlobObject DragDrop SCXW121643900 BCX0"><span class="SCXW121643900 BCX0"> </span><br class="SCXW121643900 BCX0" /></span><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">  }</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW121643900 BCX0"><span class="SCXW121643900 BCX0"> </span><br class="SCXW121643900 BCX0" /></span><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">  "stream": false</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW121643900 BCX0"><span class="SCXW121643900 BCX0"> </span><br class="SCXW121643900 BCX0" /></span><span class="TextRun SCXW121643900 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW121643900 BCX0">}'</span></span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-c478ddd elementor-widget elementor-widget-text-editor" data-id="c478ddd" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW13767485 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW13767485 BCX0">4. <b>Customize Models:</b></span></span><span class="TextRun SCXW13767485 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><b> </b><span class="NormalTextRun SpellingErrorV2Themed SCXW13767485 BCX0">Ollama</span><span class="NormalTextRun SCXW13767485 BCX0"> supports a </span><span class="NormalTextRun SpellingErrorV2Themed SCXW13767485 BCX0">Dockerfile</span><span class="NormalTextRun SCXW13767485 BCX0">-like syntax called a </span></span><span class="TextRun SCXW13767485 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW13767485 BCX0"><b>Modelfile</b></span></span><span class="TextRun SCXW13767485 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW13767485 BCX0"><b> </b>to create </span></span><span class="TextRun SCXW13767485 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW13767485 BCX0"><b>custom LLM variants</b></span></span><span class="TextRun SCXW13767485 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW13767485 BCX0">. These let you:</span></span><span class="EOP SCXW13767485 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-dde64e1 elementor-widget elementor-widget-text-editor" data-id="dde64e1" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><span data-contrast="none">Start from an existing model (like </span><span data-contrast="none">llama3</span><span data-contrast="none">)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><span data-contrast="none">Add custom system prompts</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><span data-contrast="none">Inject user-defined data (e.g., instructions, context)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><span data-contrast="none">Set model parameters, like temperature</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-9672691 elementor-widget elementor-widget-text-editor" data-id="9672691" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="none">Here is the simple example how you can create your custom assistant for processing insurance documents:</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-b3b173f elementor-widget elementor-widget-text-editor" data-id="b3b173f" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">FROM llama2:7b-chat</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">PARAMETER temperature 0.7</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">SYSTEM </span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">"""</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">You are an assistant that extracts insurance-related information from a given input text.</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">You must extract and return only the following fields:</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">- policy_number</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">- insurance_period</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">- insured (company or person name)</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">- nip (tax identification number)</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">- address (of the insured)</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">Return the output as a **clean JSON object** -- not as a string, not inside quotes, and without any commentary. If a field is missing, use "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">Not found</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">".</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">Example output format:</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">{</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">  "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW168916518 BCX0">policy_number</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">": "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">...</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">  "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW168916518 BCX0">insurance_period</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">": "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">...</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">  "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">insured</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">": "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">...</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">  "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">nip</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">": "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">...</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">",</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">  "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">address</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">": "</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">...</span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">"</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">"""</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">TEMPLATE </span></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">"""</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">{{ .</span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW168916518 BCX0">System }</span><span class="NormalTextRun SCXW168916518 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">Input:</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">{{ .</span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW168916518 BCX0">Prompt }</span><span class="NormalTextRun SCXW168916518 BCX0">}</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">Response:</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW168916518 BCX0"><span class="SCXW168916518 BCX0"> </span><br class="SCXW168916518 BCX0" /></span><span class="TextRun SCXW168916518 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW168916518 BCX0">"""</span></span><span class="EOP SCXW168916518 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span>Lorem ipsum dolor sit amet, consectetur adipiscing elit. Ut elit tellus, luctus nec ullamcorper mattis, pulvinar dapibus leo.</pre>						</div>
				</div>
				<div class="elementor-element elementor-element-70f4001 elementor-widget elementor-widget-text-editor" data-id="70f4001" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="NormalTextRun SCXW237655292 BCX0">To use </span><span class="NormalTextRun SpellingErrorV2Themed SCXW237655292 BCX0">Makefile</span><span class="NormalTextRun SCXW237655292 BCX0">, save it in a directory, e.g. insurance-</span><span class="NormalTextRun SCXW237655292 BCX0">a</span><span class="NormalTextRun SCXW237655292 BCX0">ssistant</span><span class="NormalTextRun SCXW237655292 BCX0"> and create the custom model:</span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-5d4fca1 elementor-widget elementor-widget-text-editor" data-id="5d4fca1" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW150813743 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW150813743 BCX0">ollama</span><span class="NormalTextRun SCXW150813743 BCX0"> create insurance-assistant -f insurance-</span><span class="NormalTextRun SpellingErrorV2Themed SCXW150813743 BCX0">assitant</span><span class="NormalTextRun SCXW150813743 BCX0">/</span><span class="NormalTextRun SpellingErrorV2Themed SCXW150813743 BCX0">Modelfile</span></span><span class="EOP SCXW150813743 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-3cfba04 elementor-widget elementor-widget-text-editor" data-id="3cfba04" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span data-contrast="none">Then, you can use your model by providing the proper model name in a request:</span> </p>						</div>
				</div>
				<div class="elementor-element elementor-element-607dc80 elementor-widget elementor-widget-text-editor" data-id="607dc80" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span><span data-contrast="none">curl </span><a href="http://localhost:11434/api/generate"><span data-contrast="none">http://localhost:11434/api/generate</span></a><span data-contrast="none"> -d </span><span data-contrast="none">'{</span> <br /><span data-contrast="none">  "model": "insurance-extractor",</span> <br /><span data-contrast="none">  "prompt": "",</span> <br /><span data-contrast="none">  "stream": false</span> <br /><span data-contrast="none">}'</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-bc5221c elementor-widget elementor-widget-text-editor" data-id="bc5221c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW210001513 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW210001513 BCX0">Ollama</span><span class="NormalTextRun SCXW210001513 BCX0"> is purely CLI-based, so </span><span class="NormalTextRun SCXW210001513 BCX0">there’s</span><span class="NormalTextRun SCXW210001513 BCX0"> no graphical interface. However, this makes it </span></span><span class="TextRun SCXW210001513 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW210001513 BCX0">powerful for automation</span></span><span class="TextRun SCXW210001513 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW210001513 BCX0"> – you can pipe input/output, log responses to files, or call the </span><span class="NormalTextRun SpellingErrorV2Themed SCXW210001513 BCX0">Ollama</span><span class="NormalTextRun SCXW210001513 BCX0"> API from code. In summary, with just a few commands, you have a privacy-protecting LLM running on your PC, ready to answer questions or </span><span class="NormalTextRun SCXW210001513 BCX0">assist</span><span class="NormalTextRun SCXW210001513 BCX0"> in coding, all </span></span><span class="TextRun SCXW210001513 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW210001513 BCX0">without any internet connection needed</span></span><span class="TextRun SCXW210001513 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW210001513 BCX0">.</span></span><span class="EOP SCXW210001513 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-ce97082 elementor-widget elementor-widget-heading" data-id="ce97082" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Getting Started with LM Studio (Desktop App) </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-f911779 elementor-widget elementor-widget-image" data-id="f911779" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7711" data-permalink="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/llm1/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/LLM1.png" data-orig-size="1920,1080" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LLM1" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/LLM1-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/LLM1-1030x579.png" tabindex="0" role="button" width="1030" height="579" src="https://inero-software.com/wp-content/uploads/2025/04/LLM1-1030x579.png" class="attachment-large size-large wp-image-7711" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/04/LLM1-1030x579.png 1030w, https://inero-software.com/wp-content/uploads/2025/04/LLM1-300x169.png 300w, https://inero-software.com/wp-content/uploads/2025/04/LLM1-768x432.png 768w, https://inero-software.com/wp-content/uploads/2025/04/LLM1-1536x864.png 1536w, https://inero-software.com/wp-content/uploads/2025/04/LLM1-533x300.png 533w, https://inero-software.com/wp-content/uploads/2025/04/LLM1.png 1920w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7711" data-permalink="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/llm1/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/LLM1.png" data-orig-size="1920,1080" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LLM1" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/LLM1-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/LLM1-1030x579.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-14c3b4c elementor-widget elementor-widget-text-editor" data-id="14c3b4c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><b><span data-contrast="none">LM Studio</span></b><span data-contrast="none"> is a user-friendly desktop application that lets you </span><b><span data-contrast="none">download and run local LLMs via a graphical interface</span></b><span data-contrast="none">. It’s cross-platform (Windows, macOS, Linux) and ideal for beginners who prefer not to use the command line. With LM Studio, you can chat with models in a nice UI, manage model downloads, and even run a local server to use the model in other apps.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p><p><span data-ccp-props="{}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-623f7d7 elementor-widget elementor-widget-text-editor" data-id="623f7d7" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW122283343 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW122283343 BCX0"><b>1. Install and Launch LM Studio:</b></span></span><span class="TextRun SCXW122283343 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW122283343 BCX0"> Download the installer for your OS from the LM Studio website and install it. After installation, launch the </span></span><span class="TextRun SCXW122283343 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW122283343 BCX0"><b>LM Studio</b></span></span><span class="TextRun SCXW122283343 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW122283343 BCX0"><b> app</b>. The first time you open </span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW122283343 BCX0">it,</span> <span class="NormalTextRun SCXW122283343 BCX0">you’ll</span><span class="NormalTextRun SCXW122283343 BCX0"> be prompted to download an AI model. You can choose from a list of popular open-source models. For example, you might select a smaller model like “Mistral 7B” or an instruction-tuned Llama2 variant to start.</span></span><span class="EOP SCXW122283343 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-eef6a33 elementor-widget elementor-widget-text-editor" data-id="eef6a33" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong><span class="TextRun SCXW160100961 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW160100961 BCX0">2. Run Your First Chat:</span></span></strong><span class="TextRun SCXW160100961 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW160100961 BCX0"> Once the model is downloaded, LM Studio will load it into memory. You can then start a new chat session in the app. The interface typically has a text box where you can enter your prompt or question, and the model’s response will appear in the chat window. Simply type a query (for example: </span></span><span class="TextRun SCXW160100961 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW160100961 BCX0">“What’s the capital of France?”</span></span><span class="TextRun SCXW160100961 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW160100961 BCX0"> or </span></span><span class="TextRun SCXW160100961 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW160100961 BCX0">“Explain quantum physics simply.”</span></span><span class="TextRun SCXW160100961 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW160100961 BCX0">) and hit Enter. The AI’s answer will be displayed as the “Assistant” reply in the chat. LM Studio conveniently shows the generation metrics:</span></span><span class="EOP SCXW160100961 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-e83ff6c elementor-widget elementor-widget-text-editor" data-id="e83ff6c" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="10" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><span data-contrast="none">number of input and output tokens,</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="10" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><span data-contrast="none">tokens per second &#8211; you can see how fast the model is generating text,</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="10" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><span data-contrast="none">context occupancy,</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="10" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><span data-contrast="none">system resources usage (RAM and processor usage).</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-4c50be9 elementor-widget elementor-widget-text-editor" data-id="4c50be9" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong><span class="TextRun SCXW47407587 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW47407587 BCX0">3. Explore the Features:</span></span></strong><span class="TextRun SCXW47407587 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW47407587 BCX0"> The LM Studio GUI provides </span><span class="NormalTextRun SCXW47407587 BCX0">additional</span><span class="NormalTextRun SCXW47407587 BCX0"> features accessible to both beginners and advanced users:</span></span><span class="EOP SCXW47407587 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-0bc4155 elementor-widget elementor-widget-text-editor" data-id="0bc4155" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><strong><span class="TextRun SCXW37213095 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW37213095 BCX0">Model Library:</span></span></strong><span class="TextRun SCXW37213095 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW37213095 BCX0"> A “Discover Models” or </span><span class="NormalTextRun SpellingErrorV2Themed SCXW37213095 BCX0">catalog</span><span class="NormalTextRun SCXW37213095 BCX0"> section where you can download new models or update existing ones. </span><span class="NormalTextRun SCXW37213095 BCX0">You’re</span><span class="NormalTextRun SCXW37213095 BCX0"> not limited to one model – you can have multiple models stored and switch between them. This means you have a wide selection: from small 3B parameter models for speed, up to 70B models if your system can handle them.</span></span><span class="EOP SCXW37213095 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-c3af6d0 elementor-widget elementor-widget-text-editor" data-id="c3af6d0" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><strong><span class="TextRun SCXW224090495 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW224090495 BCX0">Chat Interface:</span></span></strong><span class="TextRun SCXW224090495 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW224090495 BCX0"> The main chat screen (as shown above) is where you interact with the model. Each new prompt you enter is answered by the model in a conversational format. You can have multi-turn dialogues, just like chatting with ChatGPT. </span><span class="NormalTextRun SCXW224090495 BCX0">There’s</span><span class="NormalTextRun SCXW224090495 BCX0"> no need to manage a prompt history manually – the app keeps the conversation context.</span></span><span class="EOP SCXW224090495 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-fcf03f1 elementor-widget elementor-widget-text-editor" data-id="fcf03f1" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><strong><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0">Advanced Settings:</span></span></strong><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0"> On the side panel, LM Studio offers configuration knobs for those who want more control. You can set a </span></span><strong><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0">system prompt</span></span></strong><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0"> (a role or instruction that guides the AI’s </span><span class="NormalTextRun SpellingErrorV2Themed SCXW52102321 BCX0">behavior</span><span class="NormalTextRun SCXW52102321 BCX0"> globally), adjust generation settings like </span></span><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0">temperature</span></span><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0"> (creativity vs. consistency) and </span></span><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0">top-p</span></span><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0"> or </span></span><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0">top-k</span></span><span class="TextRun SCXW52102321 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW52102321 BCX0"> sampling for controlling randomness, max tokens for responses, etc. These options let you fine-tune how the model responds without writing any code. For instance, you could set a system instruction like “You are a helpful coding assistant,</span><span class="NormalTextRun SCXW52102321 BCX0">”.</span><span class="NormalTextRun SCXW52102321 BCX0"> This is a friendly way to customize </span><span class="NormalTextRun SpellingErrorV2Themed SCXW52102321 BCX0">behavior</span><span class="NormalTextRun SCXW52102321 BCX0">, though </span><span class="NormalTextRun SCXW52102321 BCX0">it’s</span><span class="NormalTextRun SCXW52102321 BCX0"> not as extensive as programmatic control in a CLI tool.</span></span><span class="EOP SCXW52102321 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-5378615 elementor-widget elementor-widget-image" data-id="5378615" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7710" data-permalink="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/llm2/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/LLM2.png" data-orig-size="1920,1080" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LLM2" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/LLM2-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/LLM2-1030x579.png" tabindex="0" role="button" width="1030" height="579" src="https://inero-software.com/wp-content/uploads/2025/04/LLM2-1030x579.png" class="attachment-large size-large wp-image-7710" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/04/LLM2-1030x579.png 1030w, https://inero-software.com/wp-content/uploads/2025/04/LLM2-300x169.png 300w, https://inero-software.com/wp-content/uploads/2025/04/LLM2-768x432.png 768w, https://inero-software.com/wp-content/uploads/2025/04/LLM2-1536x864.png 1536w, https://inero-software.com/wp-content/uploads/2025/04/LLM2-533x300.png 533w, https://inero-software.com/wp-content/uploads/2025/04/LLM2.png 1920w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7710" data-permalink="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/llm2/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/LLM2.png" data-orig-size="1920,1080" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LLM2" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/LLM2-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/LLM2-1030x579.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-8d32129 elementor-widget elementor-widget-text-editor" data-id="8d32129" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h6><span class="NormalTextRun SCXW87331471 BCX0">Advanced settings – </span><span class="NormalTextRun SCXW87331471 BCX0">simple </span><span class="NormalTextRun SCXW87331471 BCX0">example of </span><span class="NormalTextRun SCXW87331471 BCX0">AI assistant</span><span class="NormalTextRun SCXW87331471 BCX0"> for processing insurance documents</span></h6>						</div>
				</div>
				<div class="elementor-element elementor-element-88a1e0d elementor-widget elementor-widget-text-editor" data-id="88a1e0d" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><span class="TextRun SCXW87021791 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW87021791 BCX0"><strong>Local API Server</strong>:</span></span><span class="TextRun SCXW87021791 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW87021791 BCX0"> For developers, LM Studio includes a “Local LLM Server” mode. Just switch to Developer tab, choose the model, and toggle Start button. It enables an API endpoint on localhost that mimics the OpenAI API, allowing other programs to send requests to your local </span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW87021791 BCX0">model.</span><span class="NormalTextRun SCXW87021791 BCX0"> This is powerful if you want to integrate the local LLM into your own applications (for example, connecting a chatbot UI or using the model for AI features in an IDE) while still </span><span class="NormalTextRun SCXW87021791 BCX0">benefiting</span><span class="NormalTextRun SCXW87021791 BCX0"> from privacy and not relying on external services.</span></span><span class="EOP SCXW87021791 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-369df09 elementor-widget elementor-widget-image" data-id="369df09" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7709" data-permalink="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/llm3/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/LLM3.png" data-orig-size="1920,1080" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LLM3" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/LLM3-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/LLM3-1030x579.png" tabindex="0" role="button" width="1030" height="579" src="https://inero-software.com/wp-content/uploads/2025/04/LLM3-1030x579.png" class="attachment-large size-large wp-image-7709" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/04/LLM3-1030x579.png 1030w, https://inero-software.com/wp-content/uploads/2025/04/LLM3-300x169.png 300w, https://inero-software.com/wp-content/uploads/2025/04/LLM3-768x432.png 768w, https://inero-software.com/wp-content/uploads/2025/04/LLM3-1536x864.png 1536w, https://inero-software.com/wp-content/uploads/2025/04/LLM3-533x300.png 533w, https://inero-software.com/wp-content/uploads/2025/04/LLM3.png 1920w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7709" data-permalink="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/llm3/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/04/LLM3.png" data-orig-size="1920,1080" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="LLM3" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/04/LLM3-300x169.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/04/LLM3-1030x579.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-5937737 elementor-widget elementor-widget-text-editor" data-id="5937737" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h6><span class="TextRun SCXW123659257 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW123659257 BCX0">Developer tab</span><span class="NormalTextRun SCXW123659257 BCX0"> &#8211;</span><span class="NormalTextRun SCXW123659257 BCX0"> you can </span><span class="NormalTextRun SCXW123659257 BCX0">enable</span><span class="NormalTextRun SCXW123659257 BCX0"> local LLM server</span><span class="NormalTextRun SCXW123659257 BCX0"> hosting your customized LLM</span><span class="NormalTextRun SCXW123659257 BCX0">.</span></span><span class="EOP SCXW123659257 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559685&quot;:720,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></h6>						</div>
				</div>
				<div class="elementor-element elementor-element-06d2cee elementor-widget elementor-widget-text-editor" data-id="06d2cee" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW66765914 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW66765914 BCX0">Using LM Studio is as simple as </span><span class="NormalTextRun SpellingErrorV2Themed SCXW66765914 BCX0">chatGPT</span><span class="NormalTextRun SCXW66765914 BCX0"> – type and get answers – but entirely running on your hardware. The </span></span><span class="TextRun SCXW66765914 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW66765914 BCX0">user-friendly interface</span></span><span class="TextRun SCXW66765914 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW66765914 BCX0"> lowers the barrier to </span><span class="NormalTextRun SCXW66765914 BCX0">entry, since</span><span class="NormalTextRun SCXW66765914 BCX0"> you </span><span class="NormalTextRun SCXW66765914 BCX0">don’t</span><span class="NormalTextRun SCXW66765914 BCX0"> need to use the terminal or remember commands. You get immediate, interactive AI responses, with buttons and menus to manage everything.</span></span><span class="EOP SCXW66765914 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-b60b847 elementor-widget elementor-widget-heading" data-id="b60b847" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Ollama vs. LM Studio: Tool Comparison </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-2d19913 elementor-widget elementor-widget-text-editor" data-id="2d19913" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW228077632 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW228077632 BCX0">Both </span><span class="NormalTextRun SpellingErrorV2Themed SCXW228077632 BCX0">Ollama</span><span class="NormalTextRun SCXW228077632 BCX0"> and LM Studio let you run LLMs locally, but they cater to slightly different audiences and use-cases. </span><span class="NormalTextRun SCXW228077632 BCX0">Here’s</span><span class="NormalTextRun SCXW228077632 BCX0"> a comparison of key aspects to help you understand their differences:</span></span><span class="EOP SCXW228077632 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-872db63 elementor-widget elementor-widget-text-editor" data-id="872db63" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0"><b>Interface &amp; Ease of Use</b>:</span></span> <span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0">LM Studio</span></span><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0"> provides a polished </span></span><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0">graphical user interface</span></span><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0">, which makes it extremely approachable for beginners. </span><span class="NormalTextRun SCXW183865909 BCX0">It’s</span><span class="NormalTextRun SCXW183865909 BCX0"> point-and-click with an integrated chat window, so no technical knowledge is </span><span class="NormalTextRun SCXW183865909 BCX0">required</span><span class="NormalTextRun SCXW183865909 BCX0"> to get </span><span class="NormalTextRun SCXW183865909 BCX0">started.</span> </span><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW183865909 BCX0">Ollama</span></span><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0">, on the other hand, is a </span></span><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0">command-line interface (CLI)</span></span><span class="TextRun SCXW183865909 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW183865909 BCX0"> tool (with an optional REST API). It offers a lot of power and </span><span class="NormalTextRun SCXW183865909 BCX0">flexibility but</span><span class="NormalTextRun SCXW183865909 BCX0"> does require comfort with the terminal to use </span><span class="NormalTextRun SCXW183865909 BCX0">effectively.</span><span class="NormalTextRun SCXW183865909 BCX0"> Beginners might find </span><span class="NormalTextRun SpellingErrorV2Themed SCXW183865909 BCX0">Ollama’s</span><span class="NormalTextRun SCXW183865909 BCX0"> learning curve steeper, </span><span class="NormalTextRun SCXW183865909 BCX0">whereas</span><span class="NormalTextRun SCXW183865909 BCX0"> LM Studio feels more plug-and-play.</span></span><span class="EOP SCXW183865909 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-4f4ccfd elementor-widget elementor-widget-text-editor" data-id="4f4ccfd" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul>
<li style="list-style-type: none;">
<ul>
<li><span class="TextRun SCXW89912573 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW89912573 BCX0"><b>Supported Models:</b></span></span><span class="TextRun SCXW89912573 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW89912573 BCX0"> Both tools support a wide range of open-source LLMs. LM Studio can load any model in GGUF format (the standard for llama.cpp), meaning models like Llama 2 (7B, 13B, 70B), Mistral, Vicuna, Alpaca, </span><span class="NormalTextRun SpellingErrorV2Themed SCXW89912573 BCX0">CodeLlama</span><span class="NormalTextRun SCXW89912573 BCX0">, etc., </span><span class="NormalTextRun SCXW89912573 BCX0">as long as</span><span class="NormalTextRun SCXW89912573 BCX0"> you have the hardware for them&nbsp;</span></span><span class="EOP SCXW89912573 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}">&nbsp;</span></li>
</ul>
</li>
</ul>						</div>
				</div>
				<div class="elementor-element elementor-element-8a420f5 elementor-widget elementor-widget-text-editor" data-id="8a420f5" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul>
<li style="list-style-type: none;">
<ul>
<li><span class="TextRun SCXW72859417 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW72859417 BCX0"><b>Use Cases Suited</b>:</span></span><span class="TextRun SCXW72859417 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW72859417 BCX0"> Because of the above differences, </span></span><span class="TextRun SCXW72859417 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW72859417 BCX0"><b>LM Studio is excellent for users who want a personal ChatGPT-like assistant on their PC with minimal setup</b></span></span><span class="TextRun SCXW72859417 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW72859417 BCX0">. </span><span class="NormalTextRun SCXW72859417 BCX0">It’s</span><span class="NormalTextRun SCXW72859417 BCX0"> great for interactive Q&amp;A, brainstorming, or casual use – you launch it when you need it, type queries, get answers. </span></span><span class="TextRun SCXW72859417 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><b><span class="NormalTextRun SpellingErrorV2Themed SCXW72859417 BCX0">Ollama</span><span class="NormalTextRun SCXW72859417 BCX0"> is ideal for developers or those who want to incorporate LLMs into projects or workflows</span></b></span><span class="TextRun SCXW72859417 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW72859417 BCX0"><b>.</b> If you plan to experiment with prompts in scripts, fine-tune model </span><span class="NormalTextRun SpellingErrorV2Themed SCXW72859417 BCX0">behaviors</span><span class="NormalTextRun SCXW72859417 BCX0">, or build an app (like a chatbot, a coding assistant integration, etc.) that calls a local model, </span><span class="NormalTextRun SpellingErrorV2Themed SCXW72859417 BCX0">Ollama’s</span><span class="NormalTextRun SCXW72859417 BCX0"> CLI and API give you that flexibility.</span></span><span class="EOP SCXW72859417 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}">&nbsp;</span></li>
</ul>
</li>
</ul>						</div>
				</div>
				<div class="elementor-element elementor-element-b4240ce elementor-widget elementor-widget-heading" data-id="b4240ce" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Conclusion and Recommendations </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-a417a13 elementor-widget elementor-widget-text-editor" data-id="a417a13" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW229049291 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW229049291 BCX0">Deploying LLMs locally has </span><span class="NormalTextRun SCXW229049291 BCX0">opened up</span><span class="NormalTextRun SCXW229049291 BCX0"> a world of possibilities for developers and enthusiasts. </span><span class="NormalTextRun SCXW229049291 BCX0">We’ve</span><span class="NormalTextRun SCXW229049291 BCX0"> discussed </span></span><span class="TextRun SCXW229049291 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SpellingErrorV2Themed SCXW229049291 BCX0"><b>Ollama</b></span></span><span class="TextRun SCXW229049291 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW229049291 BCX0"> and </span></span><span class="TextRun SCXW229049291 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW229049291 BCX0"><b>LM Studio</b></span></span><span class="TextRun SCXW229049291 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW229049291 BCX0"><b> </b>– two excellent tools that make local AI accessible. To recap some guidance on choosing between them:</span></span><span class="EOP SCXW229049291 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}">&nbsp;</span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-93b9fb0 elementor-widget elementor-widget-text-editor" data-id="93b9fb0" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><span class="TextRun SCXW193410475 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW193410475 BCX0"><b>Choose LM Studio</b></span></span><span class="TextRun SCXW193410475 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW193410475 BCX0"> if you want a </span></span><span class="TextRun SCXW193410475 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW193410475 BCX0"><b>plug-and-play AI chat experience</b></span></span><span class="TextRun SCXW193410475 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW193410475 BCX0"> with a friendly GUI. </span><span class="NormalTextRun SCXW193410475 BCX0">It’s</span><span class="NormalTextRun SCXW193410475 BCX0"> perfect for beginners or those who prefer not to tinker with command lines. You get quick setup, easy model downloads, and a nice chat interface for </span><span class="NormalTextRun SCXW193410475 BCX0">interactions.</span><span class="NormalTextRun SCXW193410475 BCX0"> This might be best for someone who just wants an “offline ChatGPT” for personal use, note-taking, or idea generation without fussing over configurations. </span><span class="NormalTextRun SCXW193410475 BCX0">It’s</span><span class="NormalTextRun SCXW193410475 BCX0"> also a convenient way to demo LLM capabilities to non-technical users (since it feels like a normal app).</span></span><span class="EOP SCXW193410475 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-dcecadd elementor-widget elementor-widget-text-editor" data-id="dcecadd" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li><span class="TextRun SCXW242147822 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><b><span class="NormalTextRun SCXW242147822 BCX0">Choose </span><span class="NormalTextRun SpellingErrorV2Themed SCXW242147822 BCX0">Ollama</span></b></span><span class="TextRun SCXW242147822 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW242147822 BCX0"><b> </b>if you want </span></span><span class="TextRun SCXW242147822 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW242147822 BCX0">more<b> control, automation, or integration</b></span></span><span class="TextRun SCXW242147822 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW242147822 BCX0"><b>.</b> Developers and power users will appreciate its flexibility – you can script it, run it headless on a server, integrate the local LLM into your own apps via the API, and fine-tune model </span><span class="NormalTextRun SpellingErrorV2Themed SCXW242147822 BCX0">behavior</span><span class="NormalTextRun SCXW242147822 BCX0"> with </span><span class="NormalTextRun SpellingErrorV2Themed SCXW242147822 BCX0">Modelfiles</span><span class="NormalTextRun SCXW242147822 BCX0"> . If </span><span class="NormalTextRun SCXW242147822 BCX0">you’re</span><span class="NormalTextRun SCXW242147822 BCX0"> comfortable with a terminal and want to customize how the AI works (beyond what a GUI allows), </span><span class="NormalTextRun SpellingErrorV2Themed SCXW242147822 BCX0">Ollama</span><span class="NormalTextRun SCXW242147822 BCX0"> is a better fit. </span><span class="NormalTextRun SCXW242147822 BCX0">It’s</span><span class="NormalTextRun SCXW242147822 BCX0"> also lightweight if you intend to run background AI services continuously.</span></span><span class="EOP SCXW242147822 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:220,&quot;335559739&quot;:220}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-cd8dc50 elementor-widget elementor-widget-text-editor" data-id="cd8dc50" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW16460031 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW16460031 BCX0">Finally, remember that the </span></span><span class="TextRun SCXW16460031 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW16460031 BCX0">LLM itself</span></span><span class="TextRun SCXW16460031 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW16460031 BCX0"> (the model you choose) is as important as the tool. Spend time finding a model that suits your task – whether </span><span class="NormalTextRun SCXW16460031 BCX0">it’s</span><span class="NormalTextRun SCXW16460031 BCX0"> a concise summarizer or a creative storyteller – and fits your hardware. Both </span><span class="NormalTextRun SpellingErrorV2Themed SCXW16460031 BCX0">Ollama</span><span class="NormalTextRun SCXW16460031 BCX0"> and LM Studio make it easy to swap models, so </span><span class="NormalTextRun SCXW16460031 BCX0">you’re</span><span class="NormalTextRun SCXW16460031 BCX0"> not locked in. The ecosystem of open-source models is growing rapidly, which means running a powerful AI on your own device is only getting easier and more common.</span></span><span class="EOP SCXW16460031 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-5a3b149 elementor-widget elementor-widget-text-editor" data-id="5a3b149" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW154420196 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW154420196 BCX0">In summary</span></span><span class="TextRun SCXW154420196 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW154420196 BCX0">, deploying LLMs locally with these tools gives you the best of both worlds: AI capabilities </span><span class="NormalTextRun SCXW154420196 BCX0">similar to</span><span class="NormalTextRun SCXW154420196 BCX0"> cloud services, but with </span></span><span class="TextRun SCXW154420196 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW154420196 BCX0"><b>privacy, control, and zero ongoing cost</b></span></span><span class="TextRun SCXW154420196 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="none"><span class="NormalTextRun SCXW154420196 BCX0"><b>.</b> Whether you go with a command-line power tool like </span><span class="NormalTextRun SpellingErrorV2Themed SCXW154420196 BCX0">Ollama</span><span class="NormalTextRun SCXW154420196 BCX0"> or a user-friendly app like LM Studio, </span><span class="NormalTextRun SCXW154420196 BCX0">you’ll</span><span class="NormalTextRun SCXW154420196 BCX0"> be joining the </span><span class="NormalTextRun SCXW154420196 BCX0">cutting edge</span><span class="NormalTextRun SCXW154420196 BCX0"> of local AI development. Happy </span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW154420196 BCX0">experimenting, and</span><span class="NormalTextRun SCXW154420196 BCX0"> enjoy your new personal AI running right on your machine!</span></span><span class="EOP SCXW154420196 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}">&nbsp;</span></p>						</div>
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/deploying-llms-locally-a-guide-to-ollama-and-lm-studio/">Deploying LLMs Locally: A Guide to Ollama and LM Studio</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">7692</post-id>	</item>
		<item>
		<title>OpenAI vs. DeepSeek: A Technical Comparison Using Unified APIs</title>
		<link>https://inero-software.com/openai-vs-deepseek-a-technical-comparison-using-unified-apis/</link>
		
		<dc:creator><![CDATA[Martyna Mul]]></dc:creator>
		<pubDate>Fri, 14 Mar 2025 13:35:14 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Blog]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[AI Algorithms]]></category>
		<category><![CDATA[DeepSeek]]></category>
		<category><![CDATA[OpenAI]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=7564</guid>

					<description><![CDATA[<p> In this post, we conduct a comparative analysis of three popular LLMs—OpenAI’s GPT based models: 4o-mini and o3-mini, and open-source DeepSeek R1—to evaluate their effectiveness in reading and analyzing statistical data from large PDFs. </p>
<p>Artykuł <a href="https://inero-software.com/openai-vs-deepseek-a-technical-comparison-using-unified-apis/">OpenAI vs. DeepSeek: A Technical Comparison Using Unified APIs</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="7564" class="elementor elementor-7564" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-4c59976 e-flex e-con-boxed e-con e-parent" data-id="4c59976" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-5cf6ead elementor-widget elementor-widget-html" data-id="5cf6ead" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			 		</div>
				</div>
				<div class="elementor-element elementor-element-a037070 elementor-widget elementor-widget-text-editor" data-id="a037070" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h4><span class="TextRun SCXW23850730 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW23850730 BCX0">Large language models (LLMs) are increasingly used to </span><span class="NormalTextRun SpellingErrorV2Themed SCXW23850730 BCX0">analyze</span><span class="NormalTextRun SCXW23850730 BCX0"> and extract insights from extensive documents, including lengthy statistical reports in PDF format. However, not all models perform equally when processing large files, especially those exceeding 50 pages. In this post, we conduct a comparative analysis of three popular LLMs—OpenAI</span><span class="NormalTextRun SCXW23850730 BCX0">’s GPT based models:</span><span class="NormalTextRun SCXW23850730 BCX0"> 4o-mini</span><span class="NormalTextRun SCXW23850730 BCX0"> and</span><span class="NormalTextRun SCXW23850730 BCX0"> o3-mini, and open-source </span><span class="NormalTextRun SpellingErrorV2Themed SCXW23850730 BCX0">DeepSeek</span><span class="NormalTextRun SCXW23850730 BCX0"> R1—to evaluate their effectiveness in reading and </span><span class="NormalTextRun SpellingErrorV2Themed SCXW23850730 BCX0">analyzing</span><span class="NormalTextRun SCXW23850730 BCX0"> statistical data from large PDFs. Our assessment focuses on three key factors: accuracy, response time, and cost estimation for each model.</span></span><span class="EOP SCXW23850730 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}">&nbsp;</span></h4>						</div>
				</div>
				<div class="elementor-element elementor-element-237cac6 elementor-widget elementor-widget-text-editor" data-id="237cac6" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW241218521 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW241218521 BCX0">To ensure a fair comparison, we utilized </span><span class="NormalTextRun SpellingErrorV2Themed SCXW241218521 BCX0">LiteLLM</span><span class="NormalTextRun SCXW241218521 BCX0">, a unified API that simplifies multi-model </span><span class="NormalTextRun SCXW241218521 BCX0">LLM </span><span class="NormalTextRun SCXW241218521 BCX0">benchmarking. By standardizing interactions across different LLM providers, </span><span class="NormalTextRun SpellingErrorV2Themed SCXW241218521 BCX0">LiteLLM</span><span class="NormalTextRun SCXW241218521 BCX0"> allowed us to focus on </span><span class="NormalTextRun SCXW241218521 BCX0">evaluating LLM performance</span><span class="NormalTextRun SCXW241218521 BCX0"> metrics rather than implementation differences.</span></span><span class="EOP SCXW241218521 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-53a2380 elementor-widget elementor-widget-heading" data-id="53a2380" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">A Unified API Approach </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-f569e31 elementor-widget elementor-widget-text-editor" data-id="f569e31" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW97117196 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW97117196 BCX0">Comparing open-source and proprietary LLMs from different providers can be challenging due to their varying APIs. To standardize our testing, we utilized </span><span class="NormalTextRun SpellingErrorV2Themed SCXW97117196 BCX0">LiteLLM</span><span class="NormalTextRun SCXW97117196 BCX0">, a library that provides a consistent interface for interacting with multiple LLMs. This allowed for easier switching between models and </span><span class="NormalTextRun SCXW97117196 BCX0">facilitated</span><span class="NormalTextRun SCXW97117196 BCX0"> a more objective </span></span><span class="TextRun SCXW97117196 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW97117196 BCX0">AI model comparison</span></span><span class="TextRun SCXW97117196 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW97117196 BCX0">. Here is how easy it is to switch models using </span><span class="NormalTextRun SpellingErrorV2Themed SCXW97117196 BCX0">LiteLLM’s</span><span class="NormalTextRun SCXW97117196 BCX0"> unified API:</span></span><span class="EOP SCXW97117196 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
					</div>
				</div>
		<div class="elementor-element elementor-element-277031f e-flex e-con-boxed e-con e-parent" data-id="277031f" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-66b9211 elementor-widget elementor-widget-text-editor" data-id="66b9211" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<pre><span class="TextRun SCXW177913088 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW177913088 BCX0">import litellm</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW177913088 BCX0"><span class="SCXW177913088 BCX0"> </span><br class="SCXW177913088 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW177913088 BCX0"><span class="SCXW177913088 BCX0"> </span><br class="SCXW177913088 BCX0" /></span><span class="TextRun SCXW177913088 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW177913088 BCX0"># To use </span><span class="NormalTextRun SpellingErrorV2Themed SCXW177913088 BCX0">openai</span><span class="NormalTextRun SCXW177913088 BCX0">.</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW177913088 BCX0"><span class="SCXW177913088 BCX0"> </span><br class="SCXW177913088 BCX0" /></span><span class="TextRun SCXW177913088 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW177913088 BCX0">response = </span><span class="NormalTextRun SpellingErrorV2Themed SCXW177913088 BCX0">litellm.completion</span><span class="NormalTextRun SCXW177913088 BCX0">(model="</span><span class="NormalTextRun SCXW177913088 BCX0">o3-mini</span><span class="NormalTextRun SCXW177913088 BCX0">", messages</span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW177913088 BCX0">=[</span><span class="NormalTextRun SCXW177913088 BCX0">{"content": "Hello", "role": "user"}])</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW177913088 BCX0"><span class="SCXW177913088 BCX0"> </span><br class="SCXW177913088 BCX0" /></span><span class="LineBreakBlob BlobObject DragDrop SCXW177913088 BCX0"><span class="SCXW177913088 BCX0"> </span><br class="SCXW177913088 BCX0" /></span><span class="TextRun SCXW177913088 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW177913088 BCX0"># To use </span><span class="NormalTextRun SpellingErrorV2Themed SCXW177913088 BCX0">deepseek</span><span class="NormalTextRun SCXW177913088 BCX0">.</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW177913088 BCX0"><span class="SCXW177913088 BCX0"> </span><br class="SCXW177913088 BCX0" /></span><span class="TextRun SCXW177913088 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW177913088 BCX0">response = </span><span class="NormalTextRun SpellingErrorV2Themed SCXW177913088 BCX0">litellm.completion</span><span class="NormalTextRun SCXW177913088 BCX0">(model="</span><span class="NormalTextRun SpellingErrorV2Themed SCXW177913088 BCX0">deepseek</span><span class="NormalTextRun SCXW177913088 BCX0">/</span><span class="NormalTextRun SpellingErrorV2Themed SCXW177913088 BCX0">deepseek</span><span class="NormalTextRun SCXW177913088 BCX0">-</span><span class="NormalTextRun SCXW177913088 BCX0">reasoner</span><span class="NormalTextRun SCXW177913088 BCX0">", messages</span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW177913088 BCX0">=[</span><span class="NormalTextRun SCXW177913088 BCX0">{"content": "Hello", "role": "user"}])</span></span><span class="LineBreakBlob BlobObject DragDrop SCXW177913088 BCX0"><span class="SCXW177913088 BCX0"> </span><br class="SCXW177913088 BCX0" /></span></pre>						</div>
				</div>
				<div class="elementor-element elementor-element-ad9012a elementor-widget elementor-widget-text-editor" data-id="ad9012a" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW231103637 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW231103637 BCX0">This simplified approach helped us compare models without worrying about implementation complexities.</span></span><span class="EOP SCXW231103637 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;201341983&quot;:0,&quot;335551550&quot;:1,&quot;335551620&quot;:1,&quot;335559685&quot;:0,&quot;335559737&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:160,&quot;335559740&quot;:279}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-bdf2fca elementor-widget elementor-widget-heading" data-id="bdf2fca" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">DeepSeek vs. OpenAI – model overview </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-2a9d55a elementor-widget elementor-widget-text-editor" data-id="2a9d55a" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW72884465 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW72884465 BCX0">Before diving into the</span><span class="NormalTextRun SCXW72884465 BCX0"> AI model</span><span class="NormalTextRun SCXW72884465 BCX0"> benchmarking results, </span><span class="NormalTextRun SCXW72884465 BCX0">let&#8217;s</span><span class="NormalTextRun SCXW72884465 BCX0"> define key concepts and introduce the core specifications of the tested models.</span></span><span class="EOP SCXW72884465 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-3070cc7 elementor-widget elementor-widget-text-editor" data-id="3070cc7" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW16640192 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW16640192 BCX0">One of the most important parameters to consider</span><span class="NormalTextRun SCXW16640192 BCX0"> in LLM benchmarking</span><span class="NormalTextRun SCXW16640192 BCX0"> is the </span></span><span class="TextRun SCXW16640192 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW16640192 BCX0">context window</span></span><span class="TextRun SCXW16640192 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW16640192 BCX0">—the maximum input size a model can process at once. This is measured in tokens, which represent chunks of text rather than individual words. A larger context window allows the model to handle more extensive documents in a single request, which is particularly important when working with long statistical reports.</span></span><span class="EOP SCXW16640192 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-d7ab0b3 elementor-widget elementor-widget-text-editor" data-id="d7ab0b3" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW22985181 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW22985181 BCX0">The pricing for LLMs is typically based on token usage, which can vary depending on the type of tokens being processed. There are </span><span class="NormalTextRun SCXW22985181 BCX0">generally three</span><span class="NormalTextRun SCXW22985181 BCX0"> types of tokens involved in LLM pricing:</span></span><span class="EOP SCXW22985181 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-65a6290 elementor-widget elementor-widget-text-editor" data-id="65a6290" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ol><li data-leveltext="%1." data-font="Aptos" data-listid="12" data-list-defn-props="{&quot;335551671&quot;:1,&quot;335552541&quot;:0,&quot;335559683&quot;:0,&quot;335559684&quot;:-1,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769242&quot;:[65533,0,46],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;%1.&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><b><span data-contrast="auto">Input Tokens</span></b><span data-contrast="auto">: These are the tokens representing the user’s input, such as the text or prompt sent to the model for processing. The cost of input tokens is charged based on the number of tokens provided by the user in each request.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li><li><b><span data-contrast="auto">Cached Input Tokens</span></b><span data-contrast="auto">: Some models offer a caching mechanism, where previously used inputs are stored and reused in subsequent requests, reducing the need for reprocessing. This is often charged at a lower rate than fresh input tokens, as the model does not need to process them again from scratch.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li><li><b><span data-contrast="auto">Output Tokens</span></b><span data-contrast="auto">: These tokens represent the text or response generated by the model. Output tokens are charged based on the amount of text the model generates in response to the user&#8217;s input.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ol>						</div>
				</div>
				<div class="elementor-element elementor-element-d9daaed elementor-widget elementor-widget-text-editor" data-id="d9daaed" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW245291604 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW245291604 BCX0">The models selected for this comparison are among the latest releases from the past </span><span class="NormalTextRun SCXW245291604 BCX0">several</span><span class="NormalTextRun SCXW245291604 BCX0"> months. While they differ in pricing and capabilities, we aim to assess whether these differences translate into measurable performance variations. Below is a breakdown of the key characteristics of </span></span><span class="TextRun SCXW245291604 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW245291604 BCX0">DeepSeek-R1</span></span><span class="TextRun SCXW245291604 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW245291604 BCX0">, </span></span><span class="TextRun SCXW245291604 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW245291604 BCX0">OpenAI 4o-mini</span></span><span class="TextRun SCXW245291604 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW245291604 BCX0">, and </span></span><span class="TextRun SCXW245291604 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW245291604 BCX0">OpenAI o3-mini</span></span><span class="TextRun SCXW245291604 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW245291604 BCX0">:</span></span><span class="EOP SCXW245291604 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-c83f80c elementor-widget elementor-widget-html" data-id="c83f80c" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			<style>
    table {
        width: 100%;
        border-collapse: collapse;
        font-family: 'Roboto', sans-serif;
        font-weight: 300;
        font-size: 14px;
        color: #1C244B;
    }
    th, td {
        border: 1px solid #ddd;
        padding: 8px;
        text-align: left;
    }
    th {
        background-color: #f4f4f4;
        color: #1C244B;
    }
    tr:nth-child(even) {
        background-color: #f9f9f9;
    }
</style>

<table>
    <thead>
        <tr>
            <th></th>
            <th>DeepSeek-R1</th>
            <th>OpenAI 4o-mini</th>
            <th>OpenAI o3-mini</th>
        </tr>
    </thead>
    <tbody>
        <tr>
            <td><strong>Context Window</strong></td>
            <td>128,000 tokens</td>
            <td>128,000 tokens (with a maximum output of 16,384 tokens)</td>
            <td>200,000 tokens (with a maximum output of 100,000 tokens)</td>
        </tr>
        <tr>
            <td><strong>Release Date</strong></td>
            <td>January 2025</td>
            <td>July 2024</td>
            <td>January 2025</td>
        </tr>
        <tr>
            <td><strong>Pricing (per 1 million tokens)</strong></td>
            <td>Input: $0.55<br>Cached input: $0.14<br>Output: $2.19</td>
            <td>Input: $0.15<br>Cached input: $0.075<br>Output: $0.60</td>
            <td>Input: $1.10<br>Cached input: $0.55<br>Output: $4.40</td>
        </tr>
        <tr>
            <td><strong>Input Formats</strong></td>
            <td>Text</td>
            <td>Text, Images (including PNG, JPEG, GIF, WEBP)</td>
            <td>Text</td>
        </tr>
        <tr>
            <td><strong>Output Formats</strong></td>
            <td>Text</td>
            <td>Text</td>
            <td>Text</td>
        </tr>
    </tbody>
</table>

<!-- Link to Google Fonts -->
<link href="https://fonts.googleapis.com/css2?family=Roboto:wght@300&display=swap" rel="stylesheet">
		</div>
				</div>
				<div class="elementor-element elementor-element-fb0549b elementor-widget elementor-widget-heading" data-id="fb0549b" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">PDF file used for testing </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-898fdb5 elementor-widget elementor-widget-text-editor" data-id="898fdb5" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW165493897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW165493897 BCX0">The document </span><span class="NormalTextRun SCXW165493897 BCX0">used for testing</span><span class="NormalTextRun SCXW165493897 BCX0"> is </span><span class="NormalTextRun SCXW165493897 BCX0">composed of several chapters</span><span class="NormalTextRun SCXW165493897 BCX0"> of</span><span class="NormalTextRun SCXW165493897 BCX0"> report on the Polish and worldwide maritime economy in 20</span><span class="NormalTextRun SCXW165493897 BCX0">17-2020</span><span class="NormalTextRun SCXW165493897 BCX0">. The report</span><span class="NormalTextRun SCXW165493897 BCX0"> is </span></span><span class="TextRun SCXW165493897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW165493897 BCX0">50 pages long</span></span><span class="TextRun SCXW165493897 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"> <span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW165493897 BCX0">and </span><span class="NormalTextRun ContextualSpellingAndGrammarErrorV2Themed SCXW165493897 BCX0"> includes</span> <span class="NormalTextRun SCXW165493897 BCX0">various </span><span class="NormalTextRun SCXW165493897 BCX0">statistics and analysis of cargo traffic, shipping, shipbuilding, and other maritime industries. The data in the file is formatted in tables and text. Most of the data is presented in tables, with </span><span class="NormalTextRun SCXW165493897 BCX0">additional</span><span class="NormalTextRun SCXW165493897 BCX0"> explanations and summaries in the surrounding text.</span><span class="NormalTextRun SCXW165493897 BCX0"> Example pages of the document used for testing:</span></span><span class="EOP SCXW165493897 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-cf84d20 elementor-widget elementor-widget-image" data-id="cf84d20" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" data-attachment-id="7573" data-permalink="https://inero-software.com/openai-vs-deepseek-a-technical-comparison-using-unified-apis/grafika-14032025/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025.png" data-orig-size="2000,1414" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="grafika 14032025" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-300x212.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-1030x728.png" tabindex="0" role="button" width="1030" height="728" src="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-1030x728.png" class="attachment-large size-large wp-image-7573" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-1030x728.png 1030w, https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-300x212.png 300w, https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-768x543.png 768w, https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-1536x1086.png 1536w, https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-424x300.png 424w, https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025.png 2000w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7573" data-permalink="https://inero-software.com/openai-vs-deepseek-a-technical-comparison-using-unified-apis/grafika-14032025/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025.png" data-orig-size="2000,1414" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="grafika 14032025" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-300x212.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/03/grafika-14032025-1030x728.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-e46d19d elementor-widget elementor-widget-heading" data-id="e46d19d" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Testing Methodology </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-1ba1d08 elementor-widget elementor-widget-text-editor" data-id="1ba1d08" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW149358593 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW149358593 BCX0">We conducted a series of tests using the following maritime economy-themed </span><span class="NormalTextRun SCXW149358593 BCX0">prompts</span><span class="NormalTextRun SCXW149358593 BCX0"> and </span><span class="NormalTextRun SCXW149358593 BCX0">a </span><span class="NormalTextRun SCXW149358593 BCX0">PDF file providing context information. </span><span class="NormalTextRun SCXW149358593 BCX0">Here are example prompts</span> <span class="NormalTextRun SCXW149358593 BCX0">regarding</span><span class="NormalTextRun SCXW149358593 BCX0"> information included in the PDF</span><span class="NormalTextRun SCXW149358593 BCX0">:</span></span><span class="EOP SCXW149358593 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-4228b97 elementor-widget elementor-widget-text-editor" data-id="4228b97" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><span data-contrast="auto">Summarize the key economic findings from a maritime report.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><span data-contrast="auto">What is the total cargo turnover of Polish sea ports in 2020?</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><span data-contrast="auto">What are the main cargo types handled by Polish sea ports?</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><span data-contrast="auto">Which countries are the main trading partners of Poland in seaborne trade?</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="5" data-aria-level="1"><span data-contrast="auto">What is the average age of ships in the Polish maritime transport fleet?</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="6" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="6" data-aria-level="1"><span data-contrast="auto">What are the key economic indicators for the Polish shipbuilding industry?</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-26bc5cf elementor-widget elementor-widget-text-editor" data-id="26bc5cf" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW219856678 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW219856678 BCX0">As mentioned before, w</span><span class="NormalTextRun SCXW219856678 BCX0">e compared the following models:</span></span><span class="EOP SCXW219856678 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-890abbd elementor-widget elementor-widget-text-editor" data-id="890abbd" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="7" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><span data-contrast="auto">OpenAI&#8217;s 4o-mini</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="7" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><span data-contrast="auto">OpenAI&#8217;s </span><span data-contrast="auto">o3-mini</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="7" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><span data-contrast="auto">DeepSeek&#8217;s </span><span data-contrast="auto">deepseek-resoner (R1)</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-153e657 elementor-widget elementor-widget-text-editor" data-id="153e657" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW236391729 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW236391729 BCX0">We measured the following metrics:</span></span><span class="EOP SCXW236391729 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-6ca549e elementor-widget elementor-widget-text-editor" data-id="6ca549e" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="8" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><b><span data-contrast="auto">Inference Time</span></b><span data-contrast="auto"> – This refers to the time it takes for the model to generate a response after receiving a prompt. A lower inference time means faster responses, which is crucial for real-time applications and large-scale document processing.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="8" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><b><span data-contrast="auto">Token Usage</span></b><span data-contrast="auto"> – LLMs process and generate text in units called </span><i><span data-contrast="auto">tokens</span></i><span data-contrast="auto">. A token can be a word, part of a word, or even a punctuation mark. The total token usage includes both input tokens (the user’s query or document) and output tokens (the model’s generated response). The more tokens used, the higher the cost of the request.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="8" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><b><span data-contrast="auto">Response Cost</span></b><span data-contrast="auto"> – This is calculated as </span><b><span data-contrast="auto">token usage × model pricing</span></b><span data-contrast="auto"> (per 1,000 or 1,000,000 tokens, depending on the provider). Since different models have different pricing structures, comparing response costs helps determine which model is more cost-effective for large-scale use cases.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-e807a52 elementor-widget elementor-widget-heading" data-id="e807a52" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Test Results </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-b36a1c6 elementor-widget elementor-widget-text-editor" data-id="b36a1c6" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW217432411 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW217432411 BCX0">Here are the summarized results from our tests</span><span class="NormalTextRun SCXW217432411 BCX0"> (each test was repeated several times)</span><span class="NormalTextRun SCXW217432411 BCX0">:</span></span><span class="EOP SCXW217432411 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
				<div class="elementor-element elementor-element-f26f255 elementor-widget elementor-widget-html" data-id="f26f255" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			<style>
    table {
        width: 100%;
        border-collapse: collapse;
        font-family: 'Roboto', sans-serif;
        font-weight: 300;
        font-size: 14px;
        color: #1C244B;
    }
    th, td {
        border: 1px solid #ddd;
        padding: 8px;
        text-align: left;
    }
    th {
        background-color: #f4f4f4;
        color: #1C244B;
    }
    tr:nth-child(even) {
        background-color: #f9f9f9;
    }
</style>

<table>
    <thead>
        <tr>
            <th>Model</th>
            <th>Average Inference Time (s)</th>
            <th>Average Response Cost ($)</th>
            <th>Average Input Tokens</th>
            <th>Average Output Tokens</th>
        </tr>
    </thead>
    <tbody>
        <tr>
            <td><strong>DeepSeek R1</strong></td>
            <td>57.2</td>
            <td>0.0039</td>
            <td>63961.7</td>
            <td>751.6</td>
        </tr>
        <tr>
            <td><strong>o3-mini</strong></td>
            <td>13.8</td>
            <td>0.0755</td>
            <td>63251.5</td>
            <td>1162.5</td>
        </tr>
        <tr>
            <td><strong>4o-mini</strong></td>
            <td>9.5</td>
            <td>0.0511</td>
            <td>62538.0</td>
            <td>1046.5</td>
        </tr>
    </tbody>
</table>

<!-- Link to Google Fonts -->
<link href="https://fonts.googleapis.com/css2?family=Roboto:wght@300&display=swap" rel="stylesheet">
		</div>
				</div>
				<div class="elementor-element elementor-element-65630f9 elementor-widget elementor-widget-heading" data-id="65630f9" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Key Observations</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-703de17 elementor-widget elementor-widget-text-editor" data-id="703de17" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="1" data-aria-level="1"><b><span data-contrast="auto">Inference Time</span></b><span data-contrast="auto">: DeepSeek consistently demonstrated longer inference times compared to both OpenAI models. This could be a significant factor for applications that prioritize fast processing.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="2" data-aria-level="1"><b><span data-contrast="auto">Response Cost</span></b><span data-contrast="auto">: DeepSeek showed a competitive advantage in terms of cost, particularly for output tokens. Despite the longer inference time, DeepSeek’s overall cost per request remains lower than OpenAI o3-mini and 4o-mini. The lower response cost of DeepSeek can be attributed to its caching mechanism, which reduces the need to reprocess input data. Most of the input content, particularly the PDF file&#8217;s contents, was cached, leading to significant savings in processing costs. This caching system allowed DeepSeek to handle repeated queries more efficiently, making it a cost-effective option for processing large documents.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="3" data-aria-level="1"><b><span data-contrast="auto">Output Variability</span></b><span data-contrast="auto">: The models varied in style and the level of detail in their responses. This is important depending on the context and user requirements (e.g., high-level summaries vs. detailed analysis).</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul><ul><li style="list-style-type: none;"><ul><li data-leveltext="" data-font="Symbol" data-listid="9" data-list-defn-props="{&quot;335552541&quot;:1,&quot;335559683&quot;:0,&quot;335559684&quot;:-2,&quot;335559685&quot;:720,&quot;335559991&quot;:360,&quot;469769226&quot;:&quot;Symbol&quot;,&quot;469769242&quot;:[8226],&quot;469777803&quot;:&quot;left&quot;,&quot;469777804&quot;:&quot;&quot;,&quot;469777815&quot;:&quot;hybridMultilevel&quot;}" aria-setsize="-1" data-aria-posinset="4" data-aria-level="1"><b><span data-contrast="auto">LiteLLM API</span></b><span data-contrast="auto">: LiteLLM made it extremely easy to track cost, token usage, and response time directly from the API responses, enabling a straightforward comparison between models.</span><span data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335559738&quot;:0,&quot;335559739&quot;:0}"> </span></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-f56bc1c elementor-widget elementor-widget-heading" data-id="f56bc1c" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">Conclusion </h3>		</div>
				</div>
				<div class="elementor-element elementor-element-abbecc5 elementor-widget elementor-widget-text-editor" data-id="abbecc5" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">Our tests highlight the advantages of using unified APIs for </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">LLM benchmarking</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">. </span><span class="NormalTextRun SpellingErrorV2Themed SCXW28694121 BCX0">LiteLLM</span><span class="NormalTextRun SCXW28694121 BCX0"> significantly simplified the process, allowing us to focus on </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">LLM efficiency assessment</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0"> and </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">evaluating AI language models</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">. While </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SpellingErrorV2Themed SCXW28694121 BCX0">DeepSeek</span><span class="NormalTextRun SCXW28694121 BCX0"> R1</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0"> demonstrated </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">competitive cost-effectiveness</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">, particularly due to its caching mechanism, it was by far the </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">slowest model</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0"> in our tests, with an average inference time of </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">57.2 seconds</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">. In contrast, </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">OpenAI o3-mini</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0"> and </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">4o-mini</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0"> provided significantly </span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">faster response times</span></span><span class="TextRun SCXW28694121 BCX0" lang="EN-GB" xml:lang="EN-GB" data-contrast="auto"><span class="NormalTextRun SCXW28694121 BCX0">, making them more suitable for real-time applications.</span></span><span class="EOP TrackedChange SCXW28694121 BCX0" data-ccp-props="{&quot;134233117&quot;:false,&quot;134233118&quot;:false,&quot;335551550&quot;:0,&quot;335551620&quot;:0,&quot;335559738&quot;:240,&quot;335559739&quot;:240}"> </span></p>						</div>
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/openai-vs-deepseek-a-technical-comparison-using-unified-apis/">OpenAI vs. DeepSeek: A Technical Comparison Using Unified APIs</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">7564</post-id>	</item>
		<item>
		<title>Meet Your Personal AI Agent: A Case Study for a Freight Forwarding Company</title>
		<link>https://inero-software.com/meet-your-personal-ai-agent-a-case-study-for-a-freight-forwarding-company/</link>
		
		<dc:creator><![CDATA[Marta Kuprasz]]></dc:creator>
		<pubDate>Fri, 21 Feb 2025 11:27:19 +0000</pubDate>
				<category><![CDATA[AI]]></category>
		<category><![CDATA[Blog]]></category>
		<category><![CDATA[Company]]></category>
		<category><![CDATA[SOLUTIONS]]></category>
		<category><![CDATA[AGENT]]></category>
		<category><![CDATA[AI development]]></category>
		<category><![CDATA[AI innovations]]></category>
		<category><![CDATA[BusinessProcessesOptimization]]></category>
		<category><![CDATA[Case study]]></category>
		<category><![CDATA[Gemini]]></category>
		<category><![CDATA[Google]]></category>
		<category><![CDATA[Machine Learning]]></category>
		<guid isPermaLink="false">https://inero-software.com/?p=7341</guid>

					<description><![CDATA[<p>AI-driven tools are becoming increasingly prevalent across various industries, streamlining processes from simple graphic design and translations to advanced document, email, and database analysis. In this article, we will present a practical business application of an AI assistant in action. AI Agents have a wide range of applications, and their&#8230;</p>
<p>Artykuł <a href="https://inero-software.com/meet-your-personal-ai-agent-a-case-study-for-a-freight-forwarding-company/">Meet Your Personal AI Agent: A Case Study for a Freight Forwarding Company</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></description>
										<content:encoded><![CDATA[		<div data-elementor-type="wp-post" data-elementor-id="7341" class="elementor elementor-7341" data-elementor-post-type="post">
				<div class="elementor-element elementor-element-c1e7efe e-flex e-con-boxed e-con e-parent" data-id="c1e7efe" data-element_type="container">
					<div class="e-con-inner">
				<div class="elementor-element elementor-element-a609c1d elementor-widget elementor-widget-html" data-id="a609c1d" data-element_type="widget" data-widget_type="html.default">
				<div class="elementor-widget-container">
			 		</div>
				</div>
				<div class="elementor-element elementor-element-ff753e4 elementor-widget elementor-widget-text-editor" data-id="ff753e4" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h5>AI-driven tools are becoming increasingly prevalent across various industries, streamlining processes from simple graphic design and translations to advanced document, email, and database analysis. In this article, we will present a practical business application of an AI assistant in action.</h5>						</div>
				</div>
				<div class="elementor-element elementor-element-ee85ecd elementor-widget elementor-widget-text-editor" data-id="ee85ecd" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>AI Agents have a wide range of applications, and their full potential is still being discovered. The main advantages of AI-powered assistants include:</p>						</div>
				</div>
				<div class="elementor-element elementor-element-06bf962 elementor-widget elementor-widget-text-editor" data-id="06bf962" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<h5 data-start="49" data-end="91"><strong data-start="54" data-end="89">1. Automating Routine Processes</strong></h5><p data-start="92" data-end="294">AI agents can handle repetitive tasks such as customer inquiries, document analysis, and data management. By automating these processes, businesses can reduce operational costs and improve efficiency.</p><p data-start="92" data-end="294"> </p><h5 data-start="296" data-end="344"><strong data-start="301" data-end="342">2. Personalized Customer Interactions</strong></h5><p data-start="345" data-end="506">By analyzing data, AI agents can provide personalized recommendations and tailored offers, enhancing customer engagement and improving overall user experience.</p><p data-start="345" data-end="506"> </p><h5 data-start="508" data-end="544"><strong data-start="513" data-end="542">3. Speed and Availability</strong></h5><p data-start="545" data-end="739">AI operates 24/7, delivering instant responses and real-time support. This is particularly valuable in industries that require quick reaction times, such as e-commerce, finance, and logistics.</p><p data-start="545" data-end="739"> </p><h5 data-start="741" data-end="777"><strong data-start="746" data-end="775">4. Advanced Data Analysis</strong></h5><p data-start="778" data-end="931">AI-powered agents can process vast amounts of data in a short time, identifying patterns and correlations that support better business decision-making.</p><p data-start="778" data-end="931"> </p><h5 data-start="933" data-end="983"><strong data-start="938" data-end="981">5. Optimizing Decision-Making Processes</strong></h5><p data-start="984" data-end="1145">With predictive modeling, AI assists in demand forecasting, risk management, and supply chain optimization, helping organizations make more informed decisions.</p><p data-start="984" data-end="1145"> </p><h5 data-start="1147" data-end="1203"><strong data-start="1152" data-end="1201">6. Seamless Integration with Existing Systems</strong></h5><p data-start="1204" data-end="1369">Modern AI solutions can be easily integrated into existing ERP, CRM, and analytics platforms, enhancing their capabilities and improving overall system efficiency.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-11dd40f elementor-widget elementor-widget-heading" data-id="11dd40f" data-element_type="widget" data-widget_type="heading.default">
				<div class="elementor-widget-container">
			<h3 class="elementor-heading-title elementor-size-default">A Practical Example of AI Agent Use in the Transport Industry</h3>		</div>
				</div>
				<div class="elementor-element elementor-element-49baa37 elementor-widget__width-initial elementor-widget elementor-widget-video" data-id="49baa37" data-element_type="widget" data-settings="{&quot;youtube_url&quot;:&quot;https:\/\/youtu.be\/B4VxxjWYzDM&quot;,&quot;video_type&quot;:&quot;youtube&quot;,&quot;controls&quot;:&quot;yes&quot;}" data-widget_type="video.default">
				<div class="elementor-widget-container">
					<div class="elementor-wrapper elementor-open-inline">
			<div class="elementor-video"></div>		</div>
				</div>
				</div>
				<div class="elementor-element elementor-element-a9b9980 elementor-widget elementor-widget-text-editor" data-id="a9b9980" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>AI agents can be applied across various industries, including banking, sales, and human resource management. In this text, we will focus on a freight forwarding company that handles anywhere from a few to dozens of shipments daily.</p><p> </p><p> </p><p>Freight forwarders deal with constant communication and the verification of numerous documents. Each of these tasks takes time—a resource that is often in short supply—making errors more likely when the workload is high.</p><p> </p><p> </p><p>How can time management be improved? By automating repetitive and predictable tasks. This is where an AI Agent comes in. Here’s an example of an AI assistant we developed, powered by <a href="https://gemini.google.com/app?hl=pl">Google’s Large Language Model, Gemini.</a></p><p> </p><p>One possible application is the following scenario:</p><p> </p><p> </p><p>A freight forwarder receives an email that should include an insurance policy along with proof of payment. The AI Agent automatically, without needing to be prompted, checks whether the email contains the required attachments. If they are included, it proceeds to verify the following details:</p>						</div>
				</div>
				<div class="elementor-element elementor-element-d2f738d elementor-widget elementor-widget-text-editor" data-id="d2f738d" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p><strong>In the Insurance Policy:</strong></p><ul><li style="list-style-type: none;"><ul><li style="list-style-type: none;"><ul><li>Policy number</li><li>Insurance period and whether it is currently valid</li><li>Insured party details, including tax identification number and address</li><li>Bank account number for premium payment</li></ul></li></ul></li></ul><p><strong>In the Payment Confirmation:</strong></p><ul><li style="list-style-type: none;"><ul><li style="list-style-type: none;"><ul><li>Payment reference</li><li>Amount</li><li>Bank account number</li><li>Payment date</li><li>Whether the transfer corresponds to the submitted policy (e.g., based on the reference, account number)</li></ul></li></ul></li></ul>						</div>
				</div>
				<div class="elementor-element elementor-element-3edb3a5 elementor-widget elementor-widget-image" data-id="3edb3a5" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" width="1030" height="366" src="https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-1030x366.png" class="attachment-large size-large wp-image-7334" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-1030x366.png 1030w, https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-300x107.png 300w, https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-768x273.png 768w, https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-1536x546.png 1536w, https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-844x300.png 844w, https://inero-software.com/wp-content/uploads/2025/02/analysis-take1.png 1722w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7334" data-permalink="https://inero-software.com/pl/poznaj-swojego-osobistego-agenta-ai-case-study-dla-firmy-spedycyjnej/analysis-take1/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/02/analysis-take1.png" data-orig-size="1722,612" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="analysis-take1" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-300x107.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/02/analysis-take1-1030x366.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-a59477b elementor-widget elementor-widget-text-editor" data-id="a59477b" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>The AI Agent then transfers the extracted data into a designated Excel file, which is continuously updated. The data file can be formatted accordingly, for example, by highlighting entries in red where the insurance policy is invalid or the payment has not been verified. </p>						</div>
				</div>
				<div class="elementor-element elementor-element-ba91f9f elementor-widget elementor-widget-image" data-id="ba91f9f" data-element_type="widget" data-widget_type="image.default">
				<div class="elementor-widget-container">
													<img loading="lazy" decoding="async" width="1030" height="402" src="https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-1030x402.png" class="attachment-large size-large wp-image-7335" alt="" srcset="https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-1030x402.png 1030w, https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-300x117.png 300w, https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-768x299.png 768w, https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-1536x599.png 1536w, https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-770x300.png 770w, https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751.png 1539w" sizes="(max-width: 1030px) 100vw, 1030px" data-attachment-id="7335" data-permalink="https://inero-software.com/pl/poznaj-swojego-osobistego-agenta-ai-case-study-dla-firmy-spedycyjnej/zrzut-ekranu-2025-02-21-112751/" data-orig-file="https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751.png" data-orig-size="1539,600" data-comments-opened="0" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Zrzut ekranu 2025-02-21 112751" data-image-description="" data-image-caption="" data-medium-file="https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-300x117.png" data-large-file="https://inero-software.com/wp-content/uploads/2025/02/Zrzut-ekranu-2025-02-21-112751-1030x402.png" role="button" />													</div>
				</div>
				<div class="elementor-element elementor-element-5abc3ea elementor-widget elementor-widget-text-editor" data-id="5abc3ea" data-element_type="widget" data-widget_type="text-editor.default">
				<div class="elementor-widget-container">
							<p>In this simple way, instead of searching through their inbox for the right emails, the freight forwarder can check the Excel file to see if the documents have been received from a specific sender and whether they are correct. This saves a significant amount of time and ensures data accuracy.</p><p> </p><p>There are many ways to further develop our AI Assistant. It can be integrated with other tools, such as Slack or other communication platforms, to send notifications about missing documents or generate automated email responses. An AI-powered agent can be tailored to the specific needs of a company, a department, or even an individual role.</p>						</div>
				</div>
				<div class="elementor-element elementor-element-aee5ea0 elementor-cta--skin-cover elementor-widget__width-inherit elementor-hidden-mobile elementor-animated-content elementor-bg-transform elementor-bg-transform-zoom-in elementor-widget elementor-widget-call-to-action" data-id="aee5ea0" data-element_type="widget" data-widget_type="call-to-action.default">
				<div class="elementor-widget-container">
					<div class="elementor-cta">
					<div class="elementor-cta__bg-wrapper">
				<div class="elementor-cta__bg elementor-bg" style="background-image: url(https://inero-software.com/wp-content/uploads/2025/02/cta-AI2-1030x579.png);" role="img" aria-label="cta AI2"></div>
				<div class="elementor-cta__bg-overlay"></div>
			</div>
							<div class="elementor-cta__content">
				
									<h2 class="elementor-cta__title elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						Do you want to explore the possibilities of AI Agents?​					</h2>
				
									<div class="elementor-cta__description elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
						Schedule a meeting. We’d be happy to discuss the possibilities.					</div>
				
									<div class="elementor-cta__button-wrapper elementor-cta__content-item elementor-content-item elementor-animated-item--grow">
					<a class="elementor-cta__button elementor-button elementor-size-" href="https://calendar.google.com/calendar/u/0/appointments/schedules/AcZssZ3e3C_1YeBkt1uCr_qfOnG_N298UgLFwORcSTXigrPfOk0ls3ok-Uw_dSeGCoLdtYsN13GMm-n-">
						SCHEDULE A MEETING					</a>
					</div>
							</div>
						</div>
				</div>
				</div>
					</div>
				</div>
				</div>
		<p>Artykuł <a href="https://inero-software.com/meet-your-personal-ai-agent-a-case-study-for-a-freight-forwarding-company/">Meet Your Personal AI Agent: A Case Study for a Freight Forwarding Company</a> pochodzi z serwisu <a href="https://inero-software.com">Inero Software - Software Consulting</a>.</p>
]]></content:encoded>
					
		
		
		<post-id xmlns="com-wordpress:feed-additions:1">7341</post-id>	</item>
	</channel>
</rss>
