{"id":1333,"date":"2025-06-19T09:27:05","date_gmt":"2025-06-19T00:27:05","guid":{"rendered":"https:\/\/beeknowledge.co.jp\/?p=1333"},"modified":"2025-06-19T09:27:07","modified_gmt":"2025-06-19T00:27:07","slug":"%e3%83%9e%e3%83%ab%e3%83%81%e3%83%a2%e3%83%bc%e3%83%80%e3%83%ab%e6%8a%80%e8%a1%93%e3%81%a7%e8%b6%a3%e5%91%b3%e5%86%99%e7%9c%9fx%e6%96%87%e7%ab%a0x%e9%9f%b3%e6%a5%bd%e3%82%92%e8%9e%8d","status":"publish","type":"post","link":"https:\/\/beeknowledge.co.jp\/?p=1333","title":{"rendered":"\u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u6280\u8853\u3067\u8da3\u5473\u5199\u771f\u00d7\u6587\u7ae0\u00d7\u97f3\u697d\u3092\u878d\u5408\u3059\u308b\u5275\u4f5c\u30ac\u30a4\u30c9"},"content":{"rendered":"<div class=\"veu_autoEyeCatchBox\"><img loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"1024\" src=\"https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m-1024x1024.jpg\" class=\"attachment-large size-large wp-post-image\" alt=\"\" srcset=\"https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m-1024x1024.jpg 1024w, https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m-300x300.jpg 300w, https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m-150x150.jpg 150w, https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m-768x768.jpg 768w, https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m-1536x1536.jpg 1536w, https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m-1080x1080.jpg 1080w, https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m.jpg 2048w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/div>\n<!DOCTYPE html>\n<html lang=\"ja\">\n<head>\n  <meta charset=\"UTF-8\">\n  <title>\u8da3\u5473\u5275\u4f5c\u3067\u6d3b\u304b\u3059\u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u751f\u6210AI\uff5c\u5199\u771f\u30fb\u97f3\u697d\u30fb\u6587\u7ae0\u306e\u878d\u5408\u30ac\u30a4\u30c9<\/title>\n  <meta name=\"viewport\" content=\"width=device-width, initial-scale=1\">\n  <meta name=\"description\" content=\"\u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u751f\u6210AI\u3067\u5199\u771f\u30fb\u30c6\u30ad\u30b9\u30c8\u30fb\u97f3\u697d\u3092\u878d\u5408\u3057\u305f\u5275\u4f5c\u30a2\u30a4\u30c7\u30a2\u3084\u5b9f\u8df5\u6cd5\u3001\u80cc\u666f\u3068\u5c55\u671b\u3092\u7d39\u4ecb\u3002\u8da3\u5473\u306eAI\u6d3b\u7528\u6cd5\u3092\u3084\u3055\u3057\u304f\u89e3\u8aac\u3002\">\n  <style>\n    body {\n      font-family: 'Segoe UI', 'Yu Gothic', 'Meiryo', sans-serif;\n      background: #f5f6fa;\n      margin: 0;\n      padding: 0;\n      color: #23242b;\n    }\n    header, footer {\n      background: #2d3e50;\n      color: #fff;\n      text-align: center;\n      padding: 1.5em 0 1em 0;\n      letter-spacing: 0.05em;\n    }\n    main {\n      background: #fff;\n      max-width: 740px;\n      margin: 32px auto 24px auto;\n      padding: 2em 1.5em 2.5em 1.5em;\n      border-radius: 12px;\n      box-shadow: 0 4px 16px rgba(60,64,67,0.10);\n    }\n    h1 {\n      font-size: 1.85em;\n      letter-spacing: 0.04em;\n      margin-bottom: 0.3em;\n    }\n    h2 {\n      font-size: 1.3em;\n      border-left: 6px solid #2062af;\n      padding-left: 0.6em;\n      margin-top: 2.2em;\n      margin-bottom: 0.7em;\n      color: #2062af;\n      background: #f0f4fa;\n    }\n    h3 {\n      font-size: 1.13em;\n      color: #25598c;\n      margin-top: 1.5em;\n      margin-bottom: 0.3em;\n      font-weight: 600;\n    }\n    ul, ol {\n      margin-left: 1.2em;\n      margin-bottom: 1em;\n    }\n    ul li, ol li {\n      margin-bottom: 0.5em;\n    }\n    a {\n      color: #2463b7;\n      text-decoration: underline;\n    }\n    a:hover {\n      background: #eaf1fa;\n    }\n    code, pre {\n      background: #f5f5f5;\n      border-radius: 4px;\n      font-size: 1em;\n      color: #234;\n      padding: 0.3em 0.6em;\n      line-height: 1.65;\n    }\n    pre {\n      display: block;\n      padding: 1em 1em;\n      margin: 1em 0 1.5em 0;\n      overflow-x: auto;\n      font-size: 0.98em;\n      background: #f5f7fb;\n      border: 1px solid #e3e6ed;\n    }\n    section {\n      margin-bottom: 2em;\n    }\n    @media (max-width: 600px) {\n      main { padding: 0.6em 0.2em; }\n      h1 { font-size: 1.22em; }\n      h2 { font-size: 1.07em; }\n      pre { font-size: 0.93em; }\n    }\n  <\/style>\n<\/head>\n<body>\n  <header>\n    <div>\u5199\u771f\u30fb\u97f3\u697d\u30fb\u6587\u7ae0\u306e\u878d\u5408\u30ac\u30a4\u30c9<\/div>\n  <\/header>\n  <main>\n    <section>\n      <h2>\u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u751f\u6210AI\u3068\u306f<\/h2>\n      <p>\n        \u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u751f\u6210AI\u306f\u3001<b>\u753b\u50cf\u30fb\u30c6\u30ad\u30b9\u30c8\u30fb\u97f3\u697d\u30fb\u52d5\u753b<\/b>\u306a\u3069\u8907\u6570\u306e\u5f62\u5f0f\u3092\u540c\u6642\u306b\u6271\u3044\u3001\u81ea\u5728\u306b\u7d44\u307f\u5408\u308f\u305b\u3066\u65b0\u3057\u3044\u4f5c\u54c1\u3092\u751f\u307f\u51fa\u3059\u6280\u8853\u3067\u3059\u3002\n        \u4f8b\u3068\u3057\u3066\u300c\u5199\u771f\u304b\u3089\u8a69\u7684\u306a\u30ad\u30e3\u30d7\u30b7\u30e7\u30f3\u751f\u6210\u300d\u300c\u30c6\u30ad\u30b9\u30c8\u304b\u3089\u97f3\u697d\u751f\u6210\u300d\u300c\u753b\u50cf\u3084\u97f3\u697d\u3092\u7d71\u5408\u3057\u305f\u81ea\u52d5\u52d5\u753b\u5236\u4f5c\u300d\u306a\u3069\u304c\u6319\u3052\u3089\u308c\u307e\u3059\u3002\n        <br>\n        <a href=\"https:\/\/convin.ai\/blog\/multimodal-generative-ai\" target=\"_blank\" rel=\"noopener\">\u89e3\u8aac\u8a18\u4e8b\uff08Convin\uff09<\/a>\n      <\/p>\n    <\/section>\n\n    <section>\n      <h2>\u6700\u65b0\u306e\u30c4\u30fc\u30eb\u30fb\u8ad6\u6587\u4e8b\u4f8b<\/h2>\n      <ul>\n        <li><b>\u753b\u50cf\u30ad\u30e3\u30d7\u30b7\u30e7\u30f3\u751f\u6210<\/b>\uff1a<a href=\"https:\/\/huggingface.co\/docs\/transformers\/model_doc\/blip\" target=\"_blank\">BLIP<\/a>\u3001CLIP<\/li>\n        <li><b>\u30c6\u30ad\u30b9\u30c8\u2192\u97f3\u697d\u751f\u6210<\/b>\uff1a\n          <a href=\"https:\/\/google-research.github.io\/seanet\/musiclm\/examples\/\" target=\"_blank\">MusicLM<\/a>\uff08Google\uff09\u3001\n          <a href=\"https:\/\/openai.com\/research\/publications\/jukebox\" target=\"_blank\">OpenAI Jukebox<\/a>\u3001\n          <a href=\"https:\/\/www.riffusion.com\/about\" target=\"_blank\">Riffusion<\/a>\n        <\/li>\n        <li><b>\u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u97f3\u697d\u751f\u6210\u8ad6\u6587<\/b>\uff1a\n          <ul>\n            <li><a href=\"https:\/\/arxiv.org\/abs\/2504.13891\" target=\"_blank\">Mozualization: Crafting Music and Visual Representation<\/a><\/li>\n            <li><a href=\"https:\/\/arxiv.org\/abs\/2412.18940\" target=\"_blank\">Amuse: Human-AI Collaborative Songwriting<\/a><\/li>\n            <li><a href=\"https:\/\/arxiv.org\/abs\/2504.13535\" target=\"_blank\">MusFlow: Multimodal Music Generation<\/a><\/li>\n            <li><a href=\"https:\/\/www.mdpi.com\/2079-9292\/14\/6\/1197\" target=\"_blank\">AI-Enabled Text-to-Music Generation: Review (MDPI)<\/a><\/li>\n          <\/ul>\n        <\/li>\n      <\/ul>\n    <\/section>\n\n    <section>\n      <h2>\u5275\u4f5c\u306e\u6d41\u308c\u3068Python\u5b9f\u8df5\u4f8b<\/h2>\n      <h3>1. \u5199\u771f\u304b\u3089\u30ad\u30e3\u30d7\u30b7\u30e7\u30f3\u751f\u6210\uff08BLIP\uff09<\/h3>\n      <pre><code>from transformers import BlipProcessor, BlipForConditionalGeneration\nfrom PIL import Image\nprocessor = BlipProcessor.from_pretrained(\"Salesforce\/blip-image-captioning-base\")\nmodel = BlipForConditionalGeneration.from_pretrained(\"Salesforce\/blip-image-captioning-base\")\nimg = Image.open(\"my_photo.jpg\").convert(\"RGB\")\ninputs = processor(img, return_tensors=\"pt\")\nout = model.generate(**inputs)\ncaption = processor.decode(out[0], skip_special_tokens=True)\nprint(\"\u751f\u6210\u30ad\u30e3\u30d7\u30b7\u30e7\u30f3:\", caption)\n<\/code><\/pre>\n\n      <h3>2. \u30ad\u30e3\u30d7\u30b7\u30e7\u30f3\u304b\u3089\u97f3\u697d\u751f\u6210\uff08MusicLM\u30fbRiffusion API\u4f8b\uff09<\/h3>\n      <pre><code># \u64ec\u4f3c\u4f8b\uff1aAPI\u4ed5\u69d8\u306f\u516c\u5f0f\u53c2\u7167\nfrom musicai import MusicGenerator\nmusic = MusicGenerator().generate(prompt=caption, duration=30)\nwith open(\"music.wav\", \"wb\") as f:\n    f.write(music)\n<\/code><\/pre>\n\n      <h3>3. \u753b\u50cf\uff0b\u97f3\u697d\uff0b\u6587\u7ae0\u3067\u52d5\u753b\u5316\uff08moviepy\uff09<\/h3>\n      <pre><code>from moviepy.editor import ImageClip, AudioFileClip\nimg_clip = ImageClip(\"my_photo.jpg\").set_duration(30)\naudio_clip = AudioFileClip(\"music.wav\")\nvideo = img_clip.set_audio(audio_clip)\nvideo.write_videofile(\"output.mp4\", fps=1)\n<\/code><\/pre>\n      <p style=\"font-size:0.93em;\">\u203bAPI\u306e\u5229\u7528\u6cd5\u306f\u5404\u30b5\u30fc\u30d3\u30b9\u516c\u5f0f\u30fb\u8ad6\u6587\u30da\u30fc\u30b8\u3092\u53c2\u7167\u304f\u3060\u3055\u3044\u3002<\/p>\n    <\/section>\n\n    <section>\n      <h2>\u80cc\u666f\u3068\u4eca\u5f8c\u306e\u5c55\u671b<\/h2>\n      <p>\n        \u8fd1\u5e74\u306eTransformer\u7cfbAI\u306e\u9032\u5316\u3068\u3001API\u3084OSS\u306e\u666e\u53ca\u3067\u500b\u4eba\u30ec\u30d9\u30eb\u3067\u3082\u8907\u6570\u30e2\u30c0\u30ea\u30c6\u30a3\u3092\u878d\u5408\u3057\u305f\u5275\u4f5c\u304c\u73fe\u5b9f\u306b\u306a\u3063\u3066\u3044\u307e\u3059\u3002\n        Mozualization\u3084Amuse\u3001MusFlow\u306a\u3069\u306e\u5148\u7aef\u7814\u7a76\u3082\u9032\u307f\u3001\u8ab0\u3067\u3082\u300c\u5199\u771f\u00d7\u8a00\u8449\u00d7\u97f3\u697d\u300d\u306e\u8907\u5408\u4f5c\u54c1\u3092\u751f\u307f\u51fa\u305b\u308b\u6642\u4ee3\u304c\u5230\u6765\u3057\u3066\u3044\u307e\u3059\u3002\n        \u4eca\u5f8c\u306f\u6559\u80b2\u30fbSNS\u30fb\u5730\u57df\u30a4\u30d9\u30f3\u30c8\u306a\u3069\u3001\u8868\u73fe\u624b\u6bb5\u304c\u3055\u3089\u306b\u591a\u69d8\u5316\u3057\u3001\u8457\u4f5c\u6a29\u30fb\u502b\u7406\u3068\u5411\u304d\u5408\u3044\u306a\u304c\u3089\u3082AI\u5275\u4f5c\u6587\u5316\u304c\u5e83\u304c\u308b\u3067\u3057\u3087\u3046\u3002\n      <\/p>\n    <\/section>\n\n    <section>\n      <h2>\u53c2\u8003\u30ea\u30f3\u30af\u96c6<\/h2>\n      <ul>\n        <li><a href=\"https:\/\/convin.ai\/blog\/multimodal-generative-ai\" target=\"_blank\">How Multimodal Generative AI Is Shaping the Future\uff08Convin\uff09<\/a><\/li>\n        <li><a href=\"https:\/\/www.mdpi.com\/2079-9292\/14\/6\/1197\" target=\"_blank\">AI-Enabled Text-to-Music Generation: Comprehensive Review (MDPI)<\/a><\/li>\n        <li><a href=\"https:\/\/arxiv.org\/abs\/2504.13891\" target=\"_blank\">Mozualization: Crafting Music and Visual Representation (arXiv)<\/a><\/li>\n        <li><a href=\"https:\/\/arxiv.org\/abs\/2412.18940\" target=\"_blank\">Amuse: Human\u2011AI Collaborative Songwriting (arXiv)<\/a><\/li>\n        <li><a href=\"https:\/\/arxiv.org\/abs\/2504.13535\" target=\"_blank\">MusFlow: Multimodal Music Generation (arXiv)<\/a><\/li>\n        <li><a href=\"https:\/\/openai.com\/research\/publications\/jukebox\" target=\"_blank\">OpenAI Jukebox<\/a><\/li>\n        <li><a href=\"https:\/\/www.riffusion.com\/about\" target=\"_blank\">Riffusion<\/a><\/li>\n      <\/ul>\n    <\/section>\n  <\/main>\n  <footer>\n    <small>\u00a9 2025 \u682a\u5f0f\u4f1a\u793e\u30d3\u30fc\u30fb\u30ca\u30ec\u30c3\u30b8\u30fb\u30c7\u30b6\u30a4\u30f3<\/small>\n  <\/footer>\n<\/body>\n<\/html>\n\n","protected":false},"excerpt":{"rendered":"<p>\u8da3\u5473\u5275\u4f5c\u3067\u6d3b\u304b\u3059\u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u751f\u6210AI\uff5c\u5199\u771f\u30fb\u97f3\u697d\u30fb\u6587\u7ae0\u306e\u878d\u5408\u30ac\u30a4\u30c9 \u5199\u771f\u30fb\u97f3\u697d\u30fb\u6587\u7ae0\u306e\u878d\u5408\u30ac\u30a4\u30c9 \u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u751f\u6210AI\u3068\u306f \u30de\u30eb\u30c1\u30e2\u30fc\u30c0\u30eb\u751f\u6210AI\u306f\u3001\u753b\u50cf\u30fb\u30c6\u30ad\u30b9\u30c8\u30fb\u97f3\u697d\u30fb\u52d5\u753b\u306a\u3069\u8907\u6570\u306e\u5f62\u5f0f\u3092\u540c\u6642\u306b\u6271\u3044\u3001\u81ea\u5728\u306b\u7d44\u307f\u5408 [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":1340,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"saved_in_kubio":false,"om_disable_all_campaigns":false,"_monsterinsights_skip_tracking":false,"_monsterinsights_sitenote_active":false,"_monsterinsights_sitenote_note":"","_monsterinsights_sitenote_category":0,"_uf_show_specific_survey":0,"_uf_disable_surveys":false,"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"vkexunit_cta_each_option":"","footnotes":""},"categories":[5,59,6,54],"tags":[],"class_list":["post-1333","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-ai","category-59","category-programing","category-54"],"aioseo_notices":[],"jetpack_featured_media_url":"https:\/\/beeknowledge.co.jp\/wp-content\/uploads\/2025\/06\/mnoby2m.jpg","jetpack_sharing_enabled":true,"_links":{"self":[{"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=\/wp\/v2\/posts\/1333","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=1333"}],"version-history":[{"count":6,"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=\/wp\/v2\/posts\/1333\/revisions"}],"predecessor-version":[{"id":1339,"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=\/wp\/v2\/posts\/1333\/revisions\/1339"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=\/wp\/v2\/media\/1340"}],"wp:attachment":[{"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=1333"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=1333"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/beeknowledge.co.jp\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=1333"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}