Batch chunks from ingest.py

This commit is contained in:
2026-03-24 21:37:41 +11:00
parent a0e1f2cd75
commit 8d1f6af9c1
20 changed files with 4142 additions and 0 deletions

184
out/754690268/chunks.json Normal file
View File

@@ -0,0 +1,184 @@
[
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 0,
"timestamp": "0:00",
"timestamp_sec": 0,
"title": "Introduction and Q&A Format",
"summary": "Annie explains the session is conversational, not presentation-driven, encouraging participants to ask questions, share solutions, and engage on any topics of interest related to SecureTransport.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 1,
"timestamp": "1:05",
"timestamp_sec": 65,
"title": "File Deletion Strategy for Client Servers",
"summary": "ST push cannot delete files on remote servers. For small file counts (<100/day), use pull with delete post-transfer via custom transfer site with scheduled pulls. For larger volumes, implement custom Java-based pluggable transfer site or use the API with external scheduling. SSH protocol in 5.5+ supports age-based file detection.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 2,
"timestamp": "13:02",
"timestamp_sec": 782,
"title": "XML Export for Job Discovery",
"summary": "XML export provides accounts and subscriptions (jobs). The xml_export script in the bin directory exports configuration; never use the UI button as it can timeout and hang. Export accounts with or without routes depending on setup. Business logic must be documented separately; technical routing details are in the XML.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 3,
"timestamp": "20:47",
"timestamp_sec": 1247,
"title": "XML Parsing and Subscription Visualization",
"summary": "Pull the complete_subscription tag, look for partner_in/partner_out sections within transfer_configuration; site references map sources and destinations. XSD schema is available in ST's conf folder for parser validation.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 4,
"timestamp": "36:54",
"timestamp_sec": 2214,
"title": "Subscription Scheduling Failures and Recovery",
"summary": "If subscriptions fail without triggering, likely database corruption if cron job isn't in DB or is misconfigured. Don't delete/recreate \u2014 get support to investigate. Cron names are ID-based, not name-based. Upgrade from old 5.5 base builds may help.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 5,
"timestamp": "42:51",
"timestamp_sec": 2571,
"title": "Multi-Subscription Single-Account Performance",
"summary": "No technical limit on subscriptions per account, but UI pages slow significantly at high counts. Latest releases include folder-lookup options (recursive vs linear) and a parameter to pre-assume folder existence if checked recently. For >13,000 folders, consider multi-account strategy with cross-account site references.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 6,
"timestamp": "49:39",
"timestamp_sec": 2979,
"title": "Migration Between Servers with OS Changes",
"summary": "Do not use system export when migrating with OS change \u2014 it's OS-tied and can corrupt the destination. Instead use XML export for accounts/routes, then use API (GET/PUT) to migrate restrictions and access controls. API approach avoids OS-dependent artifacts.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 7,
"timestamp": "52:42",
"timestamp_sec": 3162,
"title": "Shared Storage Selection (NFS vs GPFS vs GFS2)",
"summary": "For Linux: GPFS (IBM) is best but expensive; GFS2 is good; NFS is easiest and supports most use cases (~90% of environments use NFS). For Windows: SMB shares are fastest. Selection depends on transfer volume, file size, and node count. Consult capacity guide for performance tables.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 8,
"timestamp": "59:04",
"timestamp_sec": 3544,
"title": "Fine-Tuning and Capacity Planning Approach",
"summary": "Start with the support portal article 'Tuning for Secure Transport.' Use baseline recommendations from capacity guide, adjust for known customer behavior. Fine-tune iteratively with load testing. Monitor errors daily \u2014 single transfer failures can signal tuning needs.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 9,
"timestamp": "62:15",
"timestamp_sec": 3735,
"title": "Subscription-Level and Scenario Tuning",
"summary": "Beyond server tuning, adjust individual subscriptions: connection count, thread pool size. Stagger scheduler times to avoid 3AM clustering. Reduce connection count to error-prone partners to lower bandwidth but increase reliability. Fine-tuning is continuous; system changes require re-tuning every 2 months.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 10,
"timestamp": "67:46",
"timestamp_sec": 4066,
"title": "Server Restart Issues on Linux (May Update)",
"summary": "When restarting Linux servers, HTTP (stateless) starts before database readiness, causing some services to fail. Solution: add sleep delay (1.5-2 seconds) in start_db script or before start_http in the startup sequence. SSH doesn't have this issue because it's stateful and detects database unavailability.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 11,
"timestamp": "72:30",
"timestamp_sec": 4350,
"title": "Windows Startup Service Ordering",
"summary": "Never set ST services to automatic startup on Windows \u2014 they start in wrong order. Create a wrapper service that calls start_all with a sleep delay before it. Linux doesn't have this issue; use startup scripts with sleep directly.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
},
{
"video_id": "754690268",
"video_url": "https://vimeo.com/754690268",
"chapter_index": 12,
"timestamp": "76:41",
"timestamp_sec": 4601,
"title": "Load Testing Approaches and Tools",
"summary": "No single recommended tool; Axway uses expensive proprietary tools internally. For simple tests, write custom scripts to send 10,000+ files and open 20 connections concurrently. For comprehensive testing with metrics, research open-source packages or ask community forum.",
"transcript": "",
"is_demo": false,
"frame_description": null,
"source": "ask-annie",
"series": "ST Best Practices Q&A"
}
]