Spaces:
Running
Running
<html xmlns="http://www.w3.org/1999/xhtml" lang="en" xml:lang="en"><head> | |
<meta charset="utf-8"> | |
<meta name="generator" content="quarto-1.3.361"> | |
<meta name="viewport" content="width=device-width, initial-scale=1.0, user-scalable=yes"> | |
<meta name="description" content="Exploring computer vision for vegan ingredient inferencing."> | |
<title>lv-recipe-chatbot - ingredient_vision</title> | |
<style> | |
code{white-space: pre-wrap;} | |
span.smallcaps{font-variant: small-caps;} | |
div.columns{display: flex; gap: min(4vw, 1.5em);} | |
div.column{flex: auto; overflow-x: auto;} | |
div.hanging-indent{margin-left: 1.5em; text-indent: -1.5em;} | |
ul.task-list{list-style: none;} | |
ul.task-list li input[type="checkbox"] { | |
width: 0.8em; | |
margin: 0 0.8em 0.2em -1em; /* quarto-specific, see https://github.com/quarto-dev/quarto-cli/issues/4556 */ | |
vertical-align: middle; | |
} | |
/* CSS for syntax highlighting */ | |
pre > code.sourceCode { white-space: pre; position: relative; } | |
pre > code.sourceCode > span { display: inline-block; line-height: 1.25; } | |
pre > code.sourceCode > span:empty { height: 1.2em; } | |
.sourceCode { overflow: visible; } | |
code.sourceCode > span { color: inherit; text-decoration: inherit; } | |
div.sourceCode { margin: 1em 0; } | |
pre.sourceCode { margin: 0; } | |
@media screen { | |
div.sourceCode { overflow: auto; } | |
} | |
@media print { | |
pre > code.sourceCode { white-space: pre-wrap; } | |
pre > code.sourceCode > span { text-indent: -5em; padding-left: 5em; } | |
} | |
pre.numberSource code | |
{ counter-reset: source-line 0; } | |
pre.numberSource code > span | |
{ position: relative; left: -4em; counter-increment: source-line; } | |
pre.numberSource code > span > a:first-child::before | |
{ content: counter(source-line); | |
position: relative; left: -1em; text-align: right; vertical-align: baseline; | |
border: none; display: inline-block; | |
-webkit-touch-callout: none; -webkit-user-select: none; | |
-khtml-user-select: none; -moz-user-select: none; | |
-ms-user-select: none; user-select: none; | |
padding: 0 4px; width: 4em; | |
} | |
pre.numberSource { margin-left: 3em; padding-left: 4px; } | |
div.sourceCode | |
{ } | |
@media screen { | |
pre > code.sourceCode > span > a:first-child::before { text-decoration: underline; } | |
} | |
</style> | |
<script src="site_libs/quarto-nav/quarto-nav.js"></script> | |
<script src="site_libs/quarto-nav/headroom.min.js"></script> | |
<script src="site_libs/clipboard/clipboard.min.js"></script> | |
<script src="site_libs/quarto-search/autocomplete.umd.js"></script> | |
<script src="site_libs/quarto-search/fuse.min.js"></script> | |
<script src="site_libs/quarto-search/quarto-search.js"></script> | |
<meta name="quarto:offset" content="./"> | |
<script src="site_libs/quarto-html/quarto.js"></script> | |
<script src="site_libs/quarto-html/popper.min.js"></script> | |
<script src="site_libs/quarto-html/tippy.umd.min.js"></script> | |
<script src="site_libs/quarto-html/anchor.min.js"></script> | |
<link href="site_libs/quarto-html/tippy.css" rel="stylesheet"> | |
<link href="site_libs/quarto-html/quarto-syntax-highlighting.css" rel="stylesheet" id="quarto-text-highlighting-styles"> | |
<script src="site_libs/bootstrap/bootstrap.min.js"></script> | |
<link href="site_libs/bootstrap/bootstrap-icons.css" rel="stylesheet"> | |
<link href="site_libs/bootstrap/bootstrap.min.css" rel="stylesheet" id="quarto-bootstrap" data-mode="light"> | |
<script id="quarto-search-options" type="application/json">{ | |
"location": "navbar", | |
"copy-button": false, | |
"collapse-after": 3, | |
"panel-placement": "end", | |
"type": "overlay", | |
"limit": 20, | |
"language": { | |
"search-no-results-text": "No results", | |
"search-matching-documents-text": "matching documents", | |
"search-copy-link-title": "Copy link to search", | |
"search-hide-matches-text": "Hide additional matches", | |
"search-more-match-text": "more match in this document", | |
"search-more-matches-text": "more matches in this document", | |
"search-clear-button-title": "Clear", | |
"search-detached-cancel-button-title": "Cancel", | |
"search-submit-button-title": "Submit", | |
"search-label": "Search" | |
} | |
}</script> | |
<link rel="stylesheet" href="styles.css"> | |
<meta property="og:title" content="lv-recipe-chatbot - ingredient_vision"> | |
<meta property="og:description" content="Exploring computer vision for vegan ingredient inferencing."> | |
<meta property="og:image" content="https://animalequality.github.io/lv-recipe-chatbot/03_ingredient_vision_files/figure-html/cell-8-output-1.png"> | |
<meta property="og:site-name" content="lv-recipe-chatbot"> | |
<meta property="og:image:height" content="256"> | |
<meta property="og:image:width" content="512"> | |
<meta name="twitter:title" content="lv-recipe-chatbot - ingredient_vision"> | |
<meta name="twitter:description" content="Exploring computer vision for vegan ingredient inferencing."> | |
<meta name="twitter:image" content="https://animalequality.github.io/lv-recipe-chatbot/03_ingredient_vision_files/figure-html/cell-8-output-1.png"> | |
<meta name="twitter:image-height" content="256"> | |
<meta name="twitter:image-width" content="512"> | |
<meta name="twitter:card" content="summary_large_image"> | |
</head> | |
<body class="nav-sidebar floating nav-fixed"> | |
<div id="quarto-search-results"></div> | |
<header id="quarto-header" class="headroom fixed-top"> | |
<nav class="navbar navbar-expand-lg navbar-dark "> | |
<div class="navbar-container container-fluid"> | |
<div class="navbar-brand-container"> | |
<a class="navbar-brand" href="./index.html"> | |
<span class="navbar-title">lv-recipe-chatbot</span> | |
</a> | |
</div> | |
<div class="quarto-navbar-tools ms-auto"> | |
</div> | |
<div id="quarto-search" class="" title="Search"></div> | |
</div> <!-- /container-fluid --> | |
</nav> | |
<nav class="quarto-secondary-nav"> | |
<div class="container-fluid d-flex"> | |
<button type="button" class="quarto-btn-toggle btn" data-bs-toggle="collapse" data-bs-target="#quarto-sidebar,#quarto-sidebar-glass" aria-controls="quarto-sidebar" aria-expanded="false" aria-label="Toggle sidebar navigation" onclick="if (window.quartoToggleHeadroom) { window.quartoToggleHeadroom(); }"> | |
<i class="bi bi-layout-text-sidebar-reverse"></i> | |
</button> | |
<nav class="quarto-page-breadcrumbs" aria-label="breadcrumb"><ol class="breadcrumb"><li class="breadcrumb-item"><a href="./ingredient_vision.html">ingredient_vision</a></li></ol></nav> | |
<a class="flex-grow-1" role="button" data-bs-toggle="collapse" data-bs-target="#quarto-sidebar,#quarto-sidebar-glass" aria-controls="quarto-sidebar" aria-expanded="false" aria-label="Toggle sidebar navigation" onclick="if (window.quartoToggleHeadroom) { window.quartoToggleHeadroom(); }"> | |
</a> | |
</div> | |
</nav> | |
</header> | |
<!-- content --> | |
<div id="quarto-content" class="quarto-container page-columns page-rows-contents page-layout-article page-navbar"> | |
<!-- sidebar --> | |
<nav id="quarto-sidebar" class="sidebar collapse collapse-horizontal sidebar-navigation floating overflow-auto"> | |
<div class="sidebar-menu-container"> | |
<ul class="list-unstyled mt-1"> | |
<li class="sidebar-item"> | |
<div class="sidebar-item-container"> | |
<a href="./index.html" class="sidebar-item-text sidebar-link"> | |
<span class="menu-text">lv-recipe-chatbot</span></a> | |
</div> | |
</li> | |
<li class="sidebar-item"> | |
<div class="sidebar-item-container"> | |
<a href="./engineer_prompt.html" class="sidebar-item-text sidebar-link"> | |
<span class="menu-text">engineer_prompt</span></a> | |
</div> | |
</li> | |
<li class="sidebar-item"> | |
<div class="sidebar-item-container"> | |
<a href="./app.html" class="sidebar-item-text sidebar-link"> | |
<span class="menu-text">app</span></a> | |
</div> | |
</li> | |
<li class="sidebar-item"> | |
<div class="sidebar-item-container"> | |
<a href="./lchain_tool.html" class="sidebar-item-text sidebar-link"> | |
<span class="menu-text">lchain_tool</span></a> | |
</div> | |
</li> | |
<li class="sidebar-item"> | |
<div class="sidebar-item-container"> | |
<a href="./ingredient_vision.html" class="sidebar-item-text sidebar-link active"> | |
<span class="menu-text">ingredient_vision</span></a> | |
</div> | |
</li> | |
<li class="sidebar-item"> | |
<div class="sidebar-item-container"> | |
<a href="./edamam_api.html" class="sidebar-item-text sidebar-link"> | |
<span class="menu-text">edamam_api</span></a> | |
</div> | |
</li> | |
</ul> | |
</div> | |
</nav> | |
<div id="quarto-sidebar-glass" data-bs-toggle="collapse" data-bs-target="#quarto-sidebar,#quarto-sidebar-glass"></div> | |
<!-- margin-sidebar --> | |
<div id="quarto-margin-sidebar" class="sidebar margin-sidebar"> | |
<nav id="TOC" role="doc-toc" class="toc-active"> | |
<h2 id="toc-title">On this page</h2> | |
<ul> | |
<li><a href="#format_image" id="toc-format_image" class="nav-link active" data-scroll-target="#format_image">format_image</a></li> | |
<li><a href="#blipimagecaptioning" id="toc-blipimagecaptioning" class="nav-link" data-scroll-target="#blipimagecaptioning">BlipImageCaptioning</a></li> | |
<li><a href="#blipimagecaptioning.inference" id="toc-blipimagecaptioning.inference" class="nav-link" data-scroll-target="#blipimagecaptioning.inference">BlipImageCaptioning.inference</a></li> | |
<li><a href="#blipvqa" id="toc-blipvqa" class="nav-link" data-scroll-target="#blipvqa">BlipVQA</a></li> | |
<li><a href="#blipvqa.inference" id="toc-blipvqa.inference" class="nav-link" data-scroll-target="#blipvqa.inference">BlipVQA.inference</a></li> | |
<li><a href="#veganingredientfinder" id="toc-veganingredientfinder" class="nav-link" data-scroll-target="#veganingredientfinder">VeganIngredientFinder</a></li> | |
<li><a href="#veganingredientfinder.list_ingredients" id="toc-veganingredientfinder.list_ingredients" class="nav-link" data-scroll-target="#veganingredientfinder.list_ingredients">VeganIngredientFinder.list_ingredients</a></li> | |
</ul> | |
<div class="toc-actions"><div><i class="bi bi-git"></i></div><div class="action-links"><p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/issues/new" class="toc-action">Report an issue</a></p></div></div></nav> | |
</div> | |
<!-- main --> | |
<main class="content" id="quarto-document-content"> | |
<header id="title-block-header" class="quarto-title-block default"> | |
<div class="quarto-title"> | |
<h1 class="title">ingredient_vision</h1> | |
</div> | |
<div> | |
<div class="description"> | |
Exploring computer vision for vegan ingredient inferencing. | |
</div> | |
</div> | |
<div class="quarto-title-meta"> | |
</div> | |
</header> | |
<!-- WARNING: THIS FILE WAS AUTOGENERATED! DO NOT EDIT! --> | |
<p>Inspiration drawn from <a href="https://github.com/microsoft/TaskMatrix">TaskMatrix aka Visual ChatGPT</a></p> | |
<hr> | |
<p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/blob/main/lv_recipe_chatbot/ingredient_vision.py#L24" target="_blank" style="float:right; font-size:smaller">source</a></p> | |
<section id="format_image" class="level3"> | |
<h3 class="anchored" data-anchor-id="format_image">format_image</h3> | |
<blockquote class="blockquote"> | |
<pre><code> format_image (image:str)</code></pre> | |
</blockquote> | |
<table class="table"> | |
<thead> | |
<tr class="header"> | |
<th></th> | |
<th><strong>Type</strong></th> | |
<th><strong>Details</strong></th> | |
</tr> | |
</thead> | |
<tbody> | |
<tr class="odd"> | |
<td>image</td> | |
<td>str</td> | |
<td>Image file path</td> | |
</tr> | |
</tbody> | |
</table> | |
<hr> | |
<p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/blob/main/lv_recipe_chatbot/ingredient_vision.py#L36" target="_blank" style="float:right; font-size:smaller">source</a></p> | |
</section> | |
<section id="blipimagecaptioning" class="level3"> | |
<h3 class="anchored" data-anchor-id="blipimagecaptioning">BlipImageCaptioning</h3> | |
<blockquote class="blockquote"> | |
<pre><code> BlipImageCaptioning (device:str)</code></pre> | |
</blockquote> | |
<p>Useful when you want to know what is inside the photo.</p> | |
<hr> | |
<p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/blob/main/lv_recipe_chatbot/ingredient_vision.py#L51" target="_blank" style="float:right; font-size:smaller">source</a></p> | |
</section> | |
<section id="blipimagecaptioning.inference" class="level3"> | |
<h3 class="anchored" data-anchor-id="blipimagecaptioning.inference">BlipImageCaptioning.inference</h3> | |
<blockquote class="blockquote"> | |
<pre><code> BlipImageCaptioning.inference | |
(image:&lt;module 'PIL.Image' from '/home/evylz/ | |
AnimalEquality/lv-recipe- | |
chatbot/env/lib/python3.10/site- | |
packages/PIL/Image.py'&gt;)</code></pre> | |
</blockquote> | |
<table class="table"> | |
<thead> | |
<tr class="header"> | |
<th></th> | |
<th><strong>Type</strong></th> | |
<th><strong>Details</strong></th> | |
</tr> | |
</thead> | |
<tbody> | |
<tr class="odd"> | |
<td>image</td> | |
<td>PIL.Image</td> | |
<td></td> | |
</tr> | |
<tr class="even"> | |
<td><strong>Returns</strong></td> | |
<td><strong>str</strong></td> | |
<td><strong>Caption for the image</strong></td> | |
</tr> | |
</tbody> | |
</table> | |
<hr> | |
<p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/blob/main/lv_recipe_chatbot/ingredient_vision.py#L60" target="_blank" style="float:right; font-size:smaller">source</a></p> | |
</section> | |
<section id="blipvqa" class="level3"> | |
<h3 class="anchored" data-anchor-id="blipvqa">BlipVQA</h3> | |
<blockquote class="blockquote"> | |
<pre><code> BlipVQA (device:str)</code></pre> | |
</blockquote> | |
<p>BLIP Visual Question Answering. Useful when you need an answer for a question based on an image. Examples: what is the background color of this image, how many cats are in this figure, what is in this figure?</p> | |
<hr> | |
<p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/blob/main/lv_recipe_chatbot/ingredient_vision.py#L76" target="_blank" style="float:right; font-size:smaller">source</a></p> | |
</section> | |
<section id="blipvqa.inference" class="level3"> | |
<h3 class="anchored" data-anchor-id="blipvqa.inference">BlipVQA.inference</h3> | |
<blockquote class="blockquote"> | |
<pre><code> BlipVQA.inference | |
(image:&lt;module 'PIL.Image' from '/home/evylz/AnimalEquali | |
ty/lv-recipe-chatbot/env/lib/python3.10/site- | |
packages/PIL/Image.py'&gt;, question:str)</code></pre> | |
</blockquote> | |
<table class="table"> | |
<thead> | |
<tr class="header"> | |
<th></th> | |
<th><strong>Type</strong></th> | |
<th><strong>Details</strong></th> | |
</tr> | |
</thead> | |
<tbody> | |
<tr class="odd"> | |
<td>image</td> | |
<td>PIL.Image</td> | |
<td></td> | |
</tr> | |
<tr class="even"> | |
<td>question</td> | |
<td>str</td> | |
<td></td> | |
</tr> | |
<tr class="odd"> | |
<td><strong>Returns</strong></td> | |
<td><strong>str</strong></td> | |
<td><strong>Answer to the query on the image</strong></td> | |
</tr> | |
</tbody> | |
</table> | |
<div class="cell"> | |
<div class="sourceCode cell-code" id="cb6"><pre class="sourceCode python code-with-copy"><code class="sourceCode python"><span id="cb6-1"><a href="#cb6-1" aria-hidden="true" tabindex="-1"></a>sample_images <span class="op">=</span> os.listdir(SAMPLE_IMG_DIR)</span> | |
<span id="cb6-2"><a href="#cb6-2" aria-hidden="true" tabindex="-1"></a>sample_images</span></code><button title="Copy to Clipboard" class="code-copy-button"><i class="bi"></i></button></pre></div> | |
<div class="cell-output cell-output-display"> | |
<pre><code>['veggie-fridge.jpeg', | |
'veg-groceries-table.jpg', | |
'fridge-splendid.jpg', | |
'neat-veg-groceries.jpg', | |
'veg-groceries-table.jpeg', | |
'Fruits-and-vegetables-one-a-table.jpg']</code></pre> | |
</div> | |
</div> | |
<div class="cell"> | |
<div class="sourceCode cell-code" id="cb8"><pre class="sourceCode python code-with-copy"><code class="sourceCode python"><span id="cb8-1"><a href="#cb8-1" aria-hidden="true" tabindex="-1"></a><span class="cf">for</span> img <span class="kw">in</span> sample_images:</span> | |
<span id="cb8-2"><a href="#cb8-2" aria-hidden="true" tabindex="-1"></a> display(format_image(SAMPLE_IMG_DIR <span class="op">/</span> img))</span></code><button title="Copy to Clipboard" class="code-copy-button"><i class="bi"></i></button></pre></div> | |
<!-- Outputs of the display(format_image(...)) loop: one image per entry of sample_images, in listing order. -->
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-8-output-1.png" class="img-fluid" alt="Formatted sample image 1 of 6: veggie-fridge.jpeg"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-8-output-2.png" class="img-fluid" alt="Formatted sample image 2 of 6: veg-groceries-table.jpg"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-8-output-3.png" class="img-fluid" alt="Formatted sample image 3 of 6: fridge-splendid.jpg"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-8-output-4.png" class="img-fluid" alt="Formatted sample image 4 of 6: neat-veg-groceries.jpg"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-8-output-5.png" class="img-fluid" alt="Formatted sample image 5 of 6: veg-groceries-table.jpeg"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-8-output-6.png" class="img-fluid" alt="Formatted sample image 6 of 6: Fruits-and-vegetables-one-a-table.jpg"></p>
</div>
</div> | |
<p>The process:</p> | |
<ol type="1"> | |
<li>Format image</li> | |
<li>Get description (caption)</li> | |
<li>Pass caption and ingredient queries to VQA</li> | |
</ol> | |
<div class="cell"> | |
<div class="sourceCode cell-code" id="cb9"><pre class="sourceCode python code-with-copy"><code class="sourceCode python"><span id="cb9-1"><a href="#cb9-1" aria-hidden="true" tabindex="-1"></a>vqa <span class="op">=</span> BlipVQA(<span class="st">"cpu"</span>)</span> | |
<span id="cb9-2"><a href="#cb9-2" aria-hidden="true" tabindex="-1"></a>img_cap <span class="op">=</span> BlipImageCaptioning(<span class="st">"cpu"</span>)</span></code><button title="Copy to Clipboard" class="code-copy-button"><i class="bi"></i></button></pre></div> | |
</div> | |
<div class="cell"> | |
<div class="sourceCode cell-code" id="cb10"><pre class="sourceCode python code-with-copy"><code class="sourceCode python"><span id="cb10-1"><a href="#cb10-1" aria-hidden="true" tabindex="-1"></a><span class="cf">for</span> img <span class="kw">in</span> sample_images:</span> | |
<span id="cb10-2"><a href="#cb10-2" aria-hidden="true" tabindex="-1"></a> img <span class="op">=</span> format_image(SAMPLE_IMG_DIR <span class="op">/</span> img)</span> | |
<span id="cb10-3"><a href="#cb10-3" aria-hidden="true" tabindex="-1"></a></span> | |
<span id="cb10-4"><a href="#cb10-4" aria-hidden="true" tabindex="-1"></a> display(desc, img.resize((<span class="bu">int</span>(img.size[<span class="dv">0</span>] <span class="op">*</span> <span class="fl">0.5</span>), <span class="bu">int</span>(img.size[<span class="dv">1</span>] <span class="op">*</span> <span class="fl">0.5</span>))))</span></code><button title="Copy to Clipboard" class="code-copy-button"><i class="bi"></i></button></pre></div> | |
<div class="cell-output cell-output-stdout"> | |
<pre><code>CPU times: user 11.4 s, sys: 7.42 ms, total: 11.4 s | |
Wall time: 1.19 s | |
CPU times: user 13.5 s, sys: 7.5 ms, total: 13.5 s | |
Wall time: 1.36 s | |
CPU times: user 12 s, sys: 0 ns, total: 12 s | |
Wall time: 1.21 s | |
CPU times: user 12.5 s, sys: 0 ns, total: 12.5 s | |
Wall time: 1.27 s | |
CPU times: user 9.25 s, sys: 7.71 ms, total: 9.25 s | |
Wall time: 936 ms | |
CPU times: user 15.7 s, sys: 7.66 ms, total: 15.7 s | |
Wall time: 1.58 s</code></pre> | |
</div> | |
<!-- Outputs of display(desc, img...): each generated caption is followed by the half-size image it describes. -->
<div class="cell-output cell-output-display">
<pre><code>'a refrigerator with food inside'</code></pre>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-10-output-3.png" class="img-fluid" alt="Half-size sample image captioned 'a refrigerator with food inside'"></p>
</div>
<div class="cell-output cell-output-display">
<pre><code>'a table with a variety of fruits and vegetables'</code></pre>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-10-output-5.png" class="img-fluid" alt="Half-size sample image captioned 'a table with a variety of fruits and vegetables'"></p>
</div>
<div class="cell-output cell-output-display">
<pre><code>'a refrigerator filled with food and drinks'</code></pre>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-10-output-7.png" class="img-fluid" alt="Half-size sample image captioned 'a refrigerator filled with food and drinks'"></p>
</div>
<div class="cell-output cell-output-display">
<pre><code>'a counter with various foods on it'</code></pre>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-10-output-9.png" class="img-fluid" alt="Half-size sample image captioned 'a counter with various foods on it'"></p>
</div>
<div class="cell-output cell-output-display">
<pre><code>'a wooden table'</code></pre>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-10-output-11.png" class="img-fluid" alt="Half-size sample image captioned 'a wooden table'"></p>
</div>
<div class="cell-output cell-output-display">
<pre><code>'a table with a variety of fruits and vegetables'</code></pre>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-10-output-13.png" class="img-fluid" alt="Half-size sample image captioned 'a table with a variety of fruits and vegetables'"></p>
</div>
</div> | |
<div class="cell"> | |
<div class="sourceCode cell-code" id="cb18"><pre class="sourceCode python code-with-copy"><code class="sourceCode python"><span id="cb18-1"><a href="#cb18-1" aria-hidden="true" tabindex="-1"></a><span class="cf">for</span> img <span class="kw">in</span> sample_images:</span> | |
<span id="cb18-2"><a href="#cb18-2" aria-hidden="true" tabindex="-1"></a> img <span class="op">=</span> format_image(SAMPLE_IMG_DIR <span class="op">/</span> img)</span> | |
<span id="cb18-3"><a href="#cb18-3" aria-hidden="true" tabindex="-1"></a> desc <span class="op">=</span> img_cap.inference(img)</span> | |
<span id="cb18-4"><a href="#cb18-4" aria-hidden="true" tabindex="-1"></a></span> | |
<span id="cb18-5"><a href="#cb18-5" aria-hidden="true" tabindex="-1"></a> answer <span class="op">+=</span> <span class="st">"</span><span class="ch">\n</span><span class="st">"</span> <span class="op">+</span> vqa.inference(</span> | |
<span id="cb18-6"><a href="#cb18-6" aria-hidden="true" tabindex="-1"></a> img, <span class="ss">f"What are three of the fruits seen in the image if any?"</span></span> | |
<span id="cb18-7"><a href="#cb18-7" aria-hidden="true" tabindex="-1"></a> )</span> | |
<span id="cb18-8"><a href="#cb18-8" aria-hidden="true" tabindex="-1"></a> answer <span class="op">+=</span> <span class="st">"</span><span class="ch">\n</span><span class="st">"</span> <span class="op">+</span> vqa.inference(</span> | |
<span id="cb18-9"><a href="#cb18-9" aria-hidden="true" tabindex="-1"></a> img, <span class="ss">f"What grains and starches are in the image if any?"</span></span> | |
<span id="cb18-10"><a href="#cb18-10" aria-hidden="true" tabindex="-1"></a> )</span> | |
<span id="cb18-11"><a href="#cb18-11" aria-hidden="true" tabindex="-1"></a> answer <span class="op">+=</span> <span class="st">"</span><span class="ch">\n</span><span class="st">"</span> <span class="op">+</span> vqa.inference(img, <span class="ss">f"Is there plant-based milk in the image?"</span>)</span> | |
<span id="cb18-12"><a href="#cb18-12" aria-hidden="true" tabindex="-1"></a> <span class="bu">print</span>(</span> | |
<span id="cb18-13"><a href="#cb18-13" aria-hidden="true" tabindex="-1"></a> <span class="ss">f"""</span><span class="sc">{</span>desc<span class="sc">}</span></span> | |
<span id="cb18-14"><a href="#cb18-14" aria-hidden="true" tabindex="-1"></a><span class="sc">{</span>answer<span class="sc">}</span><span class="ss">"""</span></span> | |
<span id="cb18-15"><a href="#cb18-15" aria-hidden="true" tabindex="-1"></a> )</span> | |
<span id="cb18-16"><a href="#cb18-16" aria-hidden="true" tabindex="-1"></a> display(img.resize((<span class="bu">int</span>(img.size[<span class="dv">0</span>] <span class="op">*</span> <span class="fl">0.75</span>), <span class="bu">int</span>(img.size[<span class="dv">1</span>] <span class="op">*</span> <span class="fl">0.75</span>))))</span></code><button title="Copy to Clipboard" class="code-copy-button"><i class="bi"></i></button></pre></div> | |
<div class="cell-output cell-output-stdout"> | |
<pre><code>CPU times: user 7.67 s, sys: 12.1 ms, total: 7.68 s | |
Wall time: 779 ms | |
a refrigerator with food inside | |
cabbage lettuce onion | |
apples | |
rice | |
yes | |
CPU times: user 10.5 s, sys: 8.13 ms, total: 10.5 s | |
Wall time: 1.06 s | |
a table with a variety of fruits and vegetables | |
broccoli and tomatoes | |
bananas apples oranges | |
potatoes | |
yes | |
CPU times: user 11.7 s, sys: 0 ns, total: 11.7 s | |
Wall time: 1.18 s | |
a refrigerator filled with food and drinks | |
broccoli and zucchini | |
bananas | |
rice | |
yes | |
CPU times: user 11.5 s, sys: 12.2 ms, total: 11.5 s | |
Wall time: 1.16 s | |
a counter with various foods on it | |
carrots and broccoli | |
apples bananas and tomatoes | |
rice | |
yes | |
CPU times: user 9.62 s, sys: 4.22 ms, total: 9.63 s | |
Wall time: 973 ms | |
a wooden table | |
potatoes and carrots | |
apples | |
potatoes | |
yes | |
CPU times: user 11.1 s, sys: 8.23 ms, total: 11.1 s | |
Wall time: 1.12 s | |
a table with a variety of fruits and vegetables | |
peppers broccoli and squash | |
watermelon limes and pineapple | |
rice | |
no</code></pre> | |
</div> | |
<!-- Images shown by the VQA loop at 75% scale, one per entry of sample_images, in the same order as the printed answers. -->
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-11-output-2.png" class="img-fluid" alt="Sample image 1 of 6 at 75% scale, captioned 'a refrigerator with food inside'"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-11-output-3.png" class="img-fluid" alt="Sample image 2 of 6 at 75% scale, captioned 'a table with a variety of fruits and vegetables'"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-11-output-4.png" class="img-fluid" alt="Sample image 3 of 6 at 75% scale, captioned 'a refrigerator filled with food and drinks'"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-11-output-5.png" class="img-fluid" alt="Sample image 4 of 6 at 75% scale, captioned 'a counter with various foods on it'"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-11-output-6.png" class="img-fluid" alt="Sample image 5 of 6 at 75% scale, captioned 'a wooden table'"></p>
</div>
<div class="cell-output cell-output-display">
<p><img src="03_ingredient_vision_files/figure-html/cell-11-output-7.png" class="img-fluid" alt="Sample image 6 of 6 at 75% scale, captioned 'a table with a variety of fruits and vegetables'"></p>
</div>
</div> | |
<hr> | |
<p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/blob/main/lv_recipe_chatbot/ingredient_vision.py#L89" target="_blank" style="float:right; font-size:smaller">source</a></p> | |
</section> | |
<section id="veganingredientfinder" class="level3"> | |
<h3 class="anchored" data-anchor-id="veganingredientfinder">VeganIngredientFinder</h3> | |
<blockquote class="blockquote"> | |
<pre><code> VeganIngredientFinder ()</code></pre> | |
</blockquote> | |
<p>Initialize self. See help(type(self)) for accurate signature.</p> | |
<hr> | |
<p><a href="https://gitlab.com/animalequality/lv-recipe-chatbot/blob/main/lv_recipe_chatbot/ingredient_vision.py#L93" target="_blank" style="float:right; font-size:smaller">source</a></p> | |
</section> | |
<section id="veganingredientfinder.list_ingredients" class="level3"> | |
<h3 class="anchored" data-anchor-id="veganingredientfinder.list_ingredients">VeganIngredientFinder.list_ingredients</h3> | |
<blockquote class="blockquote"> | |
<pre><code> VeganIngredientFinder.list_ingredients (img:str)</code></pre> | |
</blockquote> | |
<table class="table"> | |
<thead> | |
<tr class="header"> | |
<th></th> | |
<th><strong>Type</strong></th> | |
<th><strong>Details</strong></th> | |
</tr> | |
</thead> | |
<tbody> | |
<tr class="odd"> | |
<td>img</td> | |
<td>str</td> | |
<td>Image file path</td> | |
</tr> | |
<tr class="even"> | |
<td><strong>Returns</strong></td> | |
<td><strong>str</strong></td> | |
<td></td> | |
</tr> | |
</tbody> | |
</table> | |
<div class="cell"> | |
<div class="sourceCode cell-code" id="cb22"><pre class="sourceCode python code-with-copy"><code class="sourceCode python"><span id="cb22-1"><a href="#cb22-1" aria-hidden="true" tabindex="-1"></a>vegan_ingred_finder <span class="op">=</span> VeganIngredientFinder()</span> | |
<span id="cb22-2"><a href="#cb22-2" aria-hidden="true" tabindex="-1"></a>vegan_ingred_finder.list_ingredients(SAMPLE_IMG_DIR <span class="op">/</span> sample_images[<span class="dv">0</span>])</span></code><button title="Copy to Clipboard" class="code-copy-button"><i class="bi"></i></button></pre></div> | |
<div class="cell-output cell-output-display"> | |
<pre><code>'cabbage lettuce onion\napples\nrice\nplant-based milk'</code></pre> | |
</div> | |
</div> | |
</section> | |
</main> <!-- /main --> | |
<script id="quarto-html-after-body" type="application/javascript"> | |
window.document.addEventListener("DOMContentLoaded", function (event) { | |
// Mirror the stylesheet element's "data-mode" attribute onto <body>:
// "dark" yields the quarto-dark class, any other value yields quarto-light.
const toggleBodyColorMode = (bsSheetEl) => {
  const isDark = bsSheetEl.getAttribute("data-mode") === "dark";
  const bodyClasses = window.document.querySelector("body").classList;
  bodyClasses.add(isDark ? "quarto-dark" : "quarto-light");
  bodyClasses.remove(isDark ? "quarto-light" : "quarto-dark");
}
// Apply the body color class for the primary bootstrap stylesheet
// (link#quarto-bootstrap); does nothing when that link is not on the page.
const toggleBodyColorPrimary = () => {
  const primarySheet = window.document.querySelector("link#quarto-bootstrap");
  if (!primarySheet) {
    return;
  }
  toggleBodyColorMode(primarySheet);
}
// Set the initial quarto-light / quarto-dark class on <body>.
toggleBodyColorPrimary(); | |
// Icon string passed to AnchorJS below.
// NOTE(review): it is empty here; the generator may have emitted a glyph that was lost — confirm.
const icon = ""; | |
// Add AnchorJS links, placed on the right, to every element with the "anchored" class.
const anchorJS = new window.AnchorJS(); | |
anchorJS.options = { | |
placement: 'right', | |
icon: icon | |
}; | |
anchorJS.add('.anchored'); | |
// True when any class on `el` begins with "code-annotation-".
const isCodeAnnotation = (el) => {
  return Array.from(el.classList).some((className) => className.startsWith('code-annotation-'));
}
// Wire every ".code-copy-button" to ClipboardJS. The copied text is the text of
// the element immediately before the button, with code-annotation children removed.
const clipboard = new window.ClipboardJS('.code-copy-button', {
  text: function(trigger) {
    // Work on a deep clone so the rendered code block itself is never modified.
    const codeEl = trigger.previousElementSibling.cloneNode(true);
    // `children` is a live HTMLCollection: removing an element while iterating it
    // shifts the remaining siblings and skips the next one. Iterate a static
    // snapshot so consecutive annotation elements are all removed.
    for (const childEl of Array.from(codeEl.children)) {
      if (isCodeAnnotation(childEl)) {
        childEl.remove();
      }
    }
    return codeEl.innerText;
  }
});
// After a successful copy: mark the button as "checked", show "Copied!" as its
// title (plus a Bootstrap tooltip when Bootstrap is loaded), then restore the
// button one second later.
clipboard.on('success', function(e) {
  const copyButton = e.trigger;
  // release focus so the button does not stay highlighted
  copyButton.blur();
  copyButton.classList.add('code-copy-button-checked');
  const previousTitle = copyButton.getAttribute("title");
  copyButton.setAttribute("title", "Copied!");
  let copiedTooltip;
  if (window.bootstrap) {
    copyButton.setAttribute("data-bs-toggle", "tooltip");
    copyButton.setAttribute("data-bs-placement", "left");
    copyButton.setAttribute("data-bs-title", "Copied!");
    const tooltipOptions = {
      trigger: "manual",
      customClass: "code-copy-button-tooltip",
      offset: [0, -8]
    };
    copiedTooltip = new bootstrap.Tooltip(copyButton, tooltipOptions);
    copiedTooltip.show();
  }
  // Undo everything set above once the feedback has been visible for a second.
  const restoreButton = function() {
    if (copiedTooltip) {
      copiedTooltip.hide();
      copyButton.removeAttribute("data-bs-title");
      copyButton.removeAttribute("data-bs-toggle");
      copyButton.removeAttribute("data-bs-placement");
    }
    copyButton.setAttribute("title", previousTitle);
    copyButton.classList.remove('code-copy-button-checked');
  };
  setTimeout(restoreButton, 1000);
  // drop the text selection made by the copy
  e.clearSelection();
});
// Attach a tippy popup to `el`; `contentFn` is handed to tippy as the popup
// content. The popup is appended to the parent of the element tippy passes in.
function tippyHover(el, contentFn) {
  window.tippy(el, {
    allowHTML: true,
    content: contentFn,
    maxWidth: 500,
    delay: 100,
    arrow: false,
    appendTo: (reference) => reference.parentElement,
    interactive: true,
    interactiveBorder: 10,
    theme: 'quarto',
    placement: 'bottom-start'
  });
}
// Give every footnote reference (a[role="doc-noteref"]) a hover popup whose
// content is the innerHTML of the footnote element it points to.
const noterefs = window.document.querySelectorAll('a[role="doc-noteref"]');
for (var i = 0; i < noterefs.length; i++) {
  const noteRef = noterefs[i];
  const footnoteHtml = function() {
    // Prefer the explicit data attribute and fall back to the link's href.
    let target = noteRef.getAttribute('data-footnote-href') || noteRef.getAttribute('href');
    // A parseable absolute URL is reduced to its fragment; anything URL() rejects is kept as-is.
    try { target = new URL(target).hash; } catch {}
    const noteId = target.replace(/^#\/?/, "");
    return window.document.getElementById(noteId).innerHTML;
  };
  tippyHover(noteRef, footnoteHtml);
}
// The annotation element whose code lines are currently highlighted, if any.
let selectedAnnoteEl;
// Builds the CSS selector for the <span> that carries the given
// data-code-cell / data-code-annotation attribute pair.
const selectorForAnnotation = ( cell, annotation) => {
  const attrEquals = (name, value) => '[' + name + '="' + value + '"]';
  return 'span'
    + attrEquals('data-code-cell', cell)
    + attrEquals('data-code-annotation', annotation);
}
// Highlights the code lines that belong to the annotation `annoteEl` refers to.
// The element's data-target-cell / data-target-annotation attributes locate the
// annotation span; that span's data-code-lines attribute (comma separated) lists
// the lines. Two absolutely positioned overlays are created if missing and sized
// to span from the first to the last listed line: one appended to the grandparent
// of the first line element, one appended to the cell's ".code-annotation-gutter".
// Finally `annoteEl` is recorded as the current selection.
const selectCodeLines = (annoteEl) => {
  const doc = window.document;
  const targetCell = annoteEl.getAttribute("data-target-cell");
  const targetAnnotation = annoteEl.getAttribute("data-target-annotation");
  const annoteSpan = doc.querySelector(selectorForAnnotation(targetCell, targetAnnotation));
  // Line element ids have the form "<cell>-<line>".
  const lineIds = annoteSpan
    .getAttribute("data-code-lines")
    .split(",")
    .map((line) => targetCell + "-" + line);
  if (lineIds.length === 0) {
    return;
  }

  // Start from the geometry of the first line ...
  const firstLine = doc.getElementById(lineIds[0]);
  const top = firstLine.offsetTop;
  let height = firstLine.offsetHeight;
  const parent = firstLine.parentElement.parentElement;
  // ... and stretch down to the bottom edge of the last one when there are several.
  if (lineIds.length > 1) {
    const lastLine = doc.getElementById(lineIds[lineIds.length - 1]);
    height = lastLine.offsetTop + lastLine.offsetHeight - top;
  }

  if (top !== null && height !== null && parent !== null) {
    // Looks up the overlay by id, creating and attaching it on first use (the
    // host is only resolved in that case), then positions it with 2px of
    // padding above and below the lines.
    const placeOverlay = (overlayId, resolveHost) => {
      let overlay = doc.getElementById(overlayId);
      if (overlay === null) {
        overlay = doc.createElement("div");
        overlay.setAttribute("id", overlayId);
        overlay.style.position = 'absolute';
        resolveHost().appendChild(overlay);
      }
      overlay.style.top = top - 2 + "px";
      overlay.style.height = height + 4 + "px";
    };
    placeOverlay("code-annotation-line-highlight", () => parent);
    placeOverlay("code-annotation-line-highlight-gutter", () => {
      const codeCell = doc.getElementById(targetCell);
      return codeCell.querySelector('.code-annotation-gutter');
    });
  }
  selectedAnnoteEl = annoteEl;
};
// Removes both highlight overlays from the document (when they exist) and
// clears the record of the currently selected annotation.
const unselectCodeLines = () => {
  const overlayIds = ["code-annotation-line-highlight", "code-annotation-line-highlight-gutter"];
  for (const overlayId of overlayIds) {
    const overlay = window.document.getElementById(overlayId);
    if (!overlay) {
      continue;
    }
    overlay.remove();
  }
  selectedAnnoteEl = undefined;
};
// Attach click handler to the DT
// Clicking an annotation term highlights its code lines; clicking the term that
// is already selected clears the highlight again.
const annoteDls = window.document.querySelectorAll('dt[data-target-cell]');
for (const annoteDlNode of annoteDls) {
  annoteDlNode.addEventListener('click', (event) => {
    // Use the <dt> the listener is registered on. event.target can be a
    // descendant of it, which has no data-target-* attributes and would never
    // compare equal to the stored selection.
    const clickedEl = event.currentTarget;
    if (clickedEl !== selectedAnnoteEl) {
      unselectCodeLines();
      const activeEl = window.document.querySelector('dt[data-target-cell].code-annotation-active');
      if (activeEl) {
        activeEl.classList.remove('code-annotation-active');
      }
      selectCodeLines(clickedEl);
      clickedEl.classList.add('code-annotation-active');
    } else {
      // Unselect the line
      unselectCodeLines();
      clickedEl.classList.remove('code-annotation-active');
    }
  });
}
// Climbs from `el` towards the root looking for the nearest ancestor with a
// non-empty data-cites value. Returns { el, cites } where `el` is the node whose
// direct parent carries the attribute and `cites` is that value split on single
// spaces; returns undefined when no ancestor has one.
const findCites = (el) => {
  let node = el;
  while (node.parentElement) {
    const cites = node.parentElement.dataset.cites;
    if (cites) {
      return { el: node, cites: cites.split(' ') };
    }
    node = node.parentElement;
  }
  return undefined;
};
// For each bibliography reference link that findCites() can resolve, attach a
// hover popup listing the referenced entries. Each cited key contributes one
// "hanging-indent csl-entry" div, filled from the element with id "ref-<key>"
// when that element exists and left empty otherwise.
var bibliorefs = window.document.querySelectorAll('a[role="doc-biblioref"]');
bibliorefs.forEach(function(ref) {
  const citeInfo = findCites(ref);
  if (!citeInfo) {
    return;
  }
  tippyHover(citeInfo.el, function() {
    const popup = window.document.createElement('div');
    for (const cite of citeInfo.cites) {
      const entry = window.document.createElement('div');
      entry.classList.add('hanging-indent', 'csl-entry');
      const biblioDiv = window.document.getElementById('ref-' + cite);
      if (biblioDiv) {
        entry.innerHTML = biblioDiv.innerHTML;
      }
      popup.appendChild(entry);
    }
    return popup.innerHTML;
  });
});
}); | |
</script> | |
</div> <!-- /content --> | |
</body></html> |