Lightweight YouTube transcript extraction and YouTube search for apps that want video text and metadata first, then decide what to do with it. Built with TypeScript and zero runtime dependencies.
node --version # requires Node.js 18+
npm install yt-transcript-kitUse npx yt-transcript-kit --help for the CLI without installing globally.
import { fetchYouTubeTranscript, searchYouTube } from 'yt-transcript-kit';
const result = await fetchYouTubeTranscript('https://www.youtube.com/watch?v=dQw4w9WgXcQ');
console.log(result.title, result.fullText);
const videos = await searchYouTube({ query: 'typescript tutorial', maxResults: 5 });
console.log(videos[0].title, videos[0].url);Search YouTube videos without a YouTube Data API key.
import { searchYouTube } from 'yt-transcript-kit';
const results = await searchYouTube({
query: 'node.js streams',
maxResults: 10,
hl: 'en',
});
for (const video of results) {
console.log(video.title);
console.log(video.channelName, video.duration, video.viewCount);
console.log(video.url);
}Each result includes:
videoIdtitlechannelNamechannelIdpublishedAtviewCountdurationdurationSecondsthumbnailUrldescriptionurl
Fetch transcripts for search results in one call.
import { searchYouTubeWithTranscripts } from 'yt-transcript-kit';
const results = await searchYouTubeWithTranscripts({
query: 'react server components',
maxResults: 3,
includeTranscripts: true,
transcriptOptions: {
languages: ['en'],
},
});
for (const video of results) {
if (video.transcript) {
console.log(video.title, video.transcript.fullText.slice(0, 200));
} else {
console.warn(video.title, video.transcriptError);
}
}includeTranscripts: true makes one transcript request per search result, so keep maxResults modest for CLI tools and server routes.
import { fetchYouTubeTranscript, searchTranscript } from 'yt-transcript-kit';
const transcript = await fetchYouTubeTranscript('videoId');
const matches = searchTranscript(transcript, 'keyword', {
caseSensitive: false,
maxResults: 20,
contextChars: 24,
});
console.log(matches[0]);import { fetchYouTubeTranscript, chunkTranscript } from 'yt-transcript-kit';
const transcript = await fetchYouTubeTranscript('videoId');
const chunks = chunkTranscript(transcript, {
maxChars: 4000,
maxTokens: 1200,
overlapSegments: 1,
mergeAdjacentShortSegments: true,
});
console.log(chunks[0]);import { fetchYouTubeTranscript, formatTranscript } from 'yt-transcript-kit';
const transcript = await fetchYouTubeTranscript('videoId');
const plainText = formatTranscript(transcript, { mode: 'plainText' });
const markdown = formatTranscript(transcript, { mode: 'markdown', includeTimestamps: true });
const paragraphs = formatTranscript(transcript, { mode: 'paragraphs', paragraphMergeThresholdSec: 2 });
const segments = formatTranscript(transcript, { mode: 'segments' });
console.log(markdown);import { getTranscriptWithMetadata } from 'yt-transcript-kit';
const enriched = await getTranscriptWithMetadata('videoId');
console.log(enriched.channelName, enriched.duration, enriched.thumbnailUrls);import { fetchYouTubeTranscript, InMemoryTranscriptCache } from 'yt-transcript-kit';
const cache = new InMemoryTranscriptCache({ ttlMs: 60_000 });
const transcript = await fetchYouTubeTranscript('videoId', { cache });
console.log(transcript.videoId);import { fetchManyYouTubeTranscripts } from 'yt-transcript-kit';
const results = await fetchManyYouTubeTranscripts(['videoId1', 'videoId2'], { concurrency: 3 });
for (const item of results) {
if (item.success) {
console.log(item.result.videoId, item.result.languageCode);
} else {
console.error(item.input, item.error.code);
}
}import {
cleanTranscriptSegments,
cleanTranscriptText,
fetchYouTubeTranscript,
} from 'yt-transcript-kit';
const transcript = await fetchYouTubeTranscript('videoId');
const cleanedText = cleanTranscriptText(transcript, {
stripBracketedMarkers: true,
dedupeAdjacentLines: true,
});
const cleanedSegments = cleanTranscriptSegments(transcript.segments, {
normalizeWhitespace: true,
});
console.log(cleanedText, cleanedSegments.length);npx yt-transcript-kit <url>
npx yt-transcript-kit <url> --format txt
npx yt-transcript-kit <url> --format json
npx yt-transcript-kit <url> --format markdown
npx yt-transcript-kit <url> --languages de,en
npx yt-transcript-kit <url> --search "keyword"
npx yt-transcript-kit <url> --chunks --max-chars 4000
npx yt-transcript-kit batch urls.txt --format json
npx yt-transcript-kit batch urls.txt --concurrency 3
npx yt-transcript-kit search "typescript tutorial" --max-results 5
npx yt-transcript-kit search "typescript tutorial" --format json
npx yt-transcript-kit search "typescript tutorial" --transcripts --languages enUse --help to print command help.
Typical CLI uses:
--searchprints matching transcript segments with their segment index.--chunksprints chunked transcript text, or structured JSON when combined with--format json.batch <file> --format jsonreturns per-input success or failure records.search <query>prints video metadata and URLs from YouTube search results.search <query> --transcriptsalso attempts to fetch a transcript for each returned video.
INVALID_VIDEO_ID, VIDEO_UNAVAILABLE, RATE_LIMITED, NO_TRANSCRIPT, LANGUAGE_NOT_AVAILABLE, REQUEST_FAILED, EMPTY_QUERY, SEARCH_FAILED.
- Node.js
18+is required. - Standard browsers are not supported because YouTube transcript requests are blocked by CORS.
- Server runtimes, CLIs, browser extensions, and React Native are the intended environments.
npm run build
npm run typecheck
npm run test