File size: 5,081 Bytes
d8d37b0 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 |
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<title>Image to Text - Hugging Face Transformers.js</title>
<script type="module">
// Import the library
import { pipeline } from 'https://cdn.jsdelivr.net/npm/@xenova/[email protected]';
// Expose `pipeline` on `window`: the classic (non-module) script at the bottom of
// this page cannot use `import`, so it calls the function as a global instead.
window.pipeline = pipeline;
</script>
<link href="https://cdn.jsdelivr.net/npm/[email protected]/dist/css/bootstrap.min.css" rel="stylesheet">
<link rel="stylesheet" href="css/styles.css"></head>
<body>
<div class="container-main">
<!-- Page Header -->
<div class="header">
<div class="header-logo">
<img src="images/logo.png" alt="logo">
</div>
<div class="header-main-text">
<h1>Hugging Face Transformers.js</h1>
</div>
<div class="header-sub-text">
<h3>Free AI Models for JavaScript Web Development</h3>
</div>
</div>
<hr> <!-- Separator -->
<!-- Back to Home button -->
<div class="row mt-5">
<div class="col-md-12 text-center">
<a href="index.html" class="btn btn-outline-secondary"
style="color: #3c650b; border-color: #3c650b;">Back to Main Page</a>
</div>
</div>
<!-- Content -->
<div class="container mt-5">
<!-- Centered Titles -->
<div class="text-center">
<h2>Computer Vision</h2>
<h4>Image to Text</h4>
</div>
<!-- Actual Content of this page -->
<div id="image-to-text-container" class="container mt-4">
<h5>Generate a Caption for an Image with Xenova/vit-gpt2-image-captioning:</h5>
<div class="d-flex align-items-center">
<label for="imageToTextURLText" class="mb-0 text-nowrap" style="margin-right: 15px;">Enter
image URL to caption:</label>
<input type="text" class="form-control flex-grow-1" id="imageToTextURLText"
value="https://huggingface.co/datasets/Xenova/transformers.js-docs/resolve/main/cats.jpg"
placeholder="Enter image" style="margin-right: 15px; margin-left: 15px;">
<button id="ImagetoTextButton" class="btn btn-primary" onclick="captionImage()">Caption</button>
</div>
<div class="mt-4">
<h4>Output:</h4>
<pre id="outputArea"></pre>
</div>
</div>
<hr> <!-- Line Separator -->
<div id="image-to-text-local-container" class="container mt-4">
<h5>Generate a Caption for a Local Image:</h5>
<div class="d-flex align-items-center">
<label for="imagetoTextLocalFile" class="mb-0 text-nowrap"
style="margin-right: 15px;">Select Local Image:</label>
<input type="file" id="imagetoTextLocalFile" accept="image/*" />
<button id="CaptionButtonLocal" class="btn btn-primary"
onclick="captionImageLocal()">Caption</button>
</div>
<div class="mt-4">
<h4>Output:</h4>
<pre id="outputAreaLocal"></pre>
</div>
</div>
<!-- Back to Home button -->
<div class="row mt-5">
<div class="col-md-12 text-center">
<a href="index.html" class="btn btn-outline-secondary"
style="color: #3c650b; border-color: #3c650b;">Back to Main Page</a>
</div>
</div>
</div>
</div>
<script>
// Image-captioning pipeline; stays undefined until initializeModel() succeeds.
let captioner;

/**
 * Load the 'Xenova/vit-gpt2-image-captioning' image-to-text pipeline and store
 * it in `captioner`.
 *
 * This function is registered as an event listener, so nothing awaits the
 * promise it returns. A load failure is therefore handled here (logged and
 * shown in the page's output areas) instead of becoming an unhandled
 * rejection that the user never sees.
 *
 * @returns {Promise<void>} Resolves once loading has either succeeded or failed.
 */
async function initializeModel() {
    try {
        captioner = await pipeline('image-to-text', 'Xenova/vit-gpt2-image-captioning');
    } catch (err) {
        console.error('Failed to load the image captioning model:', err);
        const reason = err instanceof Error ? err.message : String(err);
        for (const id of ['outputArea', 'outputAreaLocal']) {
            const outputElement = document.getElementById(id);
            if (outputElement) {
                outputElement.textContent = `Failed to load the captioning model: ${reason}`;
            }
        }
    }
}
/**
 * Caption the image whose URL is typed into #imageToTextURLText and show the
 * pretty-printed JSON result in #outputArea.
 *
 * Guards against the two ways a click can arrive too early (no URL entered,
 * model not loaded yet) and reports fetch/inference failures in the output
 * area instead of leaving an unhandled rejection.
 *
 * @returns {Promise<void>}
 */
async function captionImage() {
    const outputElement = document.getElementById("outputArea");
    const imageUrl = document.getElementById("imageToTextURLText").value.trim();

    if (!imageUrl) {
        alert('Please enter an image URL first.');
        return;
    }
    // `captioner` is only assigned once the model has finished loading.
    if (!captioner) {
        outputElement.textContent = 'The captioning model is not ready yet. Please wait a moment and try again.';
        return;
    }

    try {
        const result = await captioner(imageUrl);
        // textContent writes the text verbatim; the <pre> keeps the JSON line breaks.
        outputElement.textContent = JSON.stringify(result, null, 2);
    } catch (err) {
        console.error('Image captioning failed:', err);
        const reason = err instanceof Error ? err.message : String(err);
        outputElement.textContent = `Could not caption the image: ${reason}`;
    }
}
/**
 * Caption the image file chosen in #imagetoTextLocalFile and show the
 * pretty-printed JSON result in #outputAreaLocal.
 *
 * The file is handed to the model through a temporary Blob URL, which is
 * always revoked afterwards so repeated clicks do not accumulate object URLs.
 * Inference failures are reported in the output area.
 *
 * @returns {Promise<void>}
 */
async function captionImageLocal() {
    const outputElement = document.getElementById("outputAreaLocal");
    const fileInput = document.getElementById("imagetoTextLocalFile");
    const file = fileInput.files[0];

    if (!file) {
        alert('Please select an image file first.');
        return;
    }
    // `captioner` is only assigned once the model has finished loading.
    if (!captioner) {
        outputElement.textContent = 'The captioning model is not ready yet. Please wait a moment and try again.';
        return;
    }

    // Create a Blob URL from the file
    const url = URL.createObjectURL(file);
    try {
        const result = await captioner(url);
        // textContent writes the text verbatim; the <pre> keeps the JSON line breaks.
        outputElement.textContent = JSON.stringify(result, null, 2);
    } catch (err) {
        console.error('Local image captioning failed:', err);
        const reason = err instanceof Error ? err.message : String(err);
        outputElement.textContent = `Could not caption the image: ${reason}`;
    } finally {
        // Release the Blob URL whether captioning succeeded or failed.
        URL.revokeObjectURL(url);
    }
}
// Start loading the model once the document has been fully parsed.
window.addEventListener("DOMContentLoaded", () => {
    initializeModel();
});
</script>
</body>
</html>