<?xml version="1.0" encoding="UTF-8"?>
<feed xmlns="http://www.w3.org/2005/Atom">
    <!-- Feed-level metadata: the feed is titled "vlm" and identifies itself by its own (self) URL. -->
    <title>vlm</title>
    <link rel="self" type="application/atom+xml" href="https://links.biapy.com/guest/tags/3440/feed"/>
    <updated>2026-04-30T04:25:08+00:00</updated>
    <id>https://links.biapy.com/guest/tags/3440/feed</id>
    <entry>
        <id>https://links.biapy.com/links/12402</id>
        <title type="text"><![CDATA[Granite 4.0 3B Vision]]></title>
        <!-- "alternate" points at the external resource this entry describes. -->
        <link rel="alternate" href="https://huggingface.co/ibm-granite/granite-4.0-3b-vision"/>
        <!-- NOTE(review): this "via" link declares type application/atom+xml, but its href is the
             same URL as the entry id; confirm that URL really serves an Atom document. -->
        <link rel="via" type="application/atom+xml" href="https://links.biapy.com/links/12402"/>
        <author>
            <name><![CDATA[Biapy]]></name>
        </author>
        <!-- The CDATA section is kept flush against the summary tags on purpose: in a text
             construct any indentation placed around or inside it becomes part of the summary value. -->
        <summary type="text"><![CDATA[Granite-4.0-3B-Vision is a vision-language model (VLM) designed for enterprise-grade document data extraction. It focuses on specialized, complex extraction tasks that ultracompact models often struggle with.

Related contents:

- [Granite 4.0 3B Vision: Compact Multimodal Intelligence for Enterprise Documents  @ Hugging Face](https://huggingface.co/blog/ibm-granite/granite-4-vision).]]></summary>
        <updated>2026-04-03T14:29:59+00:00</updated>
    </entry>
</feed>
