Skip to content

Commit

Permalink
Merge pull request #20 from lamalab-org/Beyond_images
Browse files Browse the repository at this point in the history
edited cleaning notebook; added beyond image script
  • Loading branch information
marawilhelmi authored Jun 3, 2024
2 parents 452b4ce + bcb6342 commit a16e4c6
Show file tree
Hide file tree
Showing 13 changed files with 3,920 additions and 43 deletions.
79 changes: 79 additions & 0 deletions VLMs.drawio
Original file line number Diff line number Diff line change
@@ -0,0 +1,79 @@
<mxfile host="app.diagrams.net" modified="2024-05-30T10:35:27.701Z" agent="Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/16.6 Safari/605.1.15" etag="SSOQSFM1PfSLfv0epuuk" version="24.4.10" type="github">
<diagram name="Seite-1" id="zDdVwDyc1Fwn5zu0NveK">
<mxGraphModel dx="1224" dy="816" grid="1" gridSize="10" guides="1" tooltips="1" connect="1" arrows="1" fold="1" page="1" pageScale="1" pageWidth="827" pageHeight="1169" math="0" shadow="0">
<root>
<mxCell id="0" />
<mxCell id="1" parent="0" />
<mxCell id="O20LecAtxoyKpuHzmxib-49" value="" style="group;fontSize=11;verticalAlign=top;" parent="1" vertex="1" connectable="0">
<mxGeometry x="7" y="90" width="703" height="220" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-36" value="&lt;h3&gt;Text prompt&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=30;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#f5f5f5;fontColor=#333333;strokeColor=#666666;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="388.3646341463415" y="132" width="114.02317073170731" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-35" value="&lt;h3&gt;Image prompt&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=30;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#f5f5f5;fontColor=#333333;strokeColor=#666666;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;spacingBottom=23;spacing=0;spacingLeft=6;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="388.3646341463415" y="35.2" width="114.02317073170731" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-34" value="&lt;h3&gt;Base-64&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=30;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#f5f5f5;fontColor=#333333;strokeColor=#666666;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="291.48780487804873" y="35.2" width="114.02317073170731" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-33" value="&lt;h3&gt;Data cleaning&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=30;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#f5f5f5;fontColor=#333333;strokeColor=#666666;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;spacingLeft=7;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="195.36541463414633" y="35.2" width="114.02317073170731" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-32" value="&lt;h3&gt;Images&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=30;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#f5f5f5;fontColor=#333333;strokeColor=#666666;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="96.87682926829268" y="35.2" width="114.02317073170731" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-6" value="&lt;h3&gt;PDF&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=30;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#f5f5f5;fontColor=#333333;strokeColor=#666666;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry y="35.2" width="114.02317073170731" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-9" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.documents;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontFamily=Lucida Console;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="35.578658536585365" y="73.08000000000001" width="42.86585365853659" height="46.64000000000001" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-11" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.filtering_rule;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontFamily=Lucida Console;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="230.19820731707316" y="70.4" width="44.36615853658537" height="49.28000000000001" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-15" value="" style="shape=mxgraph.signs.tech.camera_2;html=1;pointerEvents=1;fillColor=#647687;strokeColor=none;verticalLabelPosition=bottom;verticalAlign=top;align=center;sketch=0;fontColor=#ffffff;fontFamily=Lucida Console;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="128.5461219512195" y="80.52000000000002" width="50.68458536585365" height="39.160000000000004" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-16" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.automation;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontFamily=Lucida Console;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="325.780487804878" y="70.84000000000002" width="46.29512195121951" height="46.64000000000001" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-25" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.assignment_task;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontFamily=Lucida Console;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="433.3737804878049" y="72.16000000000001" width="34.29268292682927" height="44" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-27" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.requester;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontFamily=Lucida Console;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="428.2298780487805" y="172.24" width="34.29268292682927" height="44" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-28" value="&lt;h1&gt;VLM&lt;/h1&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=30;notch=0;fontFamily=Lucida Console;fontSize=11;fillColor=#bac8d3;strokeColor=#23445d;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;spacingRight=9;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="574.4024390243903" y="35.2" width="128.59756097560975" height="184.8" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-31" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.ec2;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontFamily=Lucida Console;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="599.9076219512194" y="111.32000000000001" width="65.58475609756098" height="81.84000000000002" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-37" value="&lt;h3 style=&quot;line-height: 10%;&quot;&gt;Image&amp;nbsp;&lt;/h3&gt;&lt;h3 style=&quot;line-height: 10%;&quot;&gt;Encoder&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=0;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#bac8d3;strokeColor=#23445d;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;spacingLeft=19;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="483.95548780487803" y="35.2" width="84.44573170731707" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-38" value="&lt;h3 style=&quot;line-height: 30%;&quot;&gt;Text&lt;/h3&gt;&lt;h3 style=&quot;line-height: 30%;&quot;&gt;Decoder&lt;/h3&gt;" style="html=1;shadow=0;dashed=0;align=center;verticalAlign=top;shape=mxgraph.arrows2.arrow;dy=0;dx=0;notch=30;fontFamily=Lucida Console;fontSize=11;fillColor=#bac8d3;strokeColor=#23445d;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;spacingLeft=21;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="485.8844512195122" y="132" width="82.51676829268293" height="88" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-41" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.instances_2;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="514.19" y="80.44" width="39.83" height="37.04" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-43" value="" style="outlineConnect=0;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;shape=mxgraph.aws3.search_documents;fillColor=#647687;fontColor=#ffffff;strokeColor=#314354;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="516.9621951219511" y="181.04000000000002" width="34.29268292682927" height="35.2" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-44" value="" style="shape=crossbar;whiteSpace=wrap;html=1;rounded=1;strokeWidth=2;fillColor=#647687;strokeColor=#000000;fontColor=#ffffff;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry y="14.960000000000003" width="474.0963414634146" height="17.6" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-46" value="Preprocessing" style="text;html=1;align=center;verticalAlign=middle;resizable=0;points=[];autosize=1;strokeColor=none;fillColor=none;fontFamily=Lucida Console;fontSize=11;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="204.75487804878048" width="90" height="30" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-47" value="" style="shape=crossbar;whiteSpace=wrap;html=1;rounded=1;strokeWidth=2;fillColor=#647687;strokeColor=#000000;fontColor=#ffffff;fontSize=11;movable=1;resizable=1;rotatable=1;deletable=1;editable=1;locked=0;connectable=1;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="483.95548780487803" y="14.960000000000003" width="195.89695121951218" height="17.6" as="geometry" />
</mxCell>
<mxCell id="O20LecAtxoyKpuHzmxib-48" value="VLM model call" style="text;html=1;align=center;verticalAlign=middle;resizable=0;points=[];autosize=1;strokeColor=none;fillColor=none;fontFamily=Lucida Console;fontSize=11;" parent="O20LecAtxoyKpuHzmxib-49" vertex="1">
<mxGeometry x="540.4649390243903" width="100" height="30" as="geometry" />
</mxCell>
</root>
</mxGraphModel>
</diagram>
</mxfile>
1 change: 1 addition & 0 deletions _quarto.yml
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,7 @@ book:
- obtaining_data/annotation.ipynb
- constrained_decoding/index.ipynb
- document_parsing_and_cleaning/document_parsing_and_cleaning.qmd
- beyond_text/beyond_images.ipynb

- part: Case Studies
chapters:
Expand Down
Loading

0 comments on commit a16e4c6

Please sign in to comment.