{"id":50410,"date":"2023-08-08T16:53:03","date_gmt":"2024-01-26T13:34:42","guid":{"rendered":"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/"},"modified":"2024-04-30T17:35:43","modified_gmt":"2024-04-30T09:35:43","slug":"%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82","status":"publish","type":"post","link":"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/","title":{"rendered":"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b"},"content":{"rendered":"<p>\u6211\u4f1a\u4e3a\u60a8\u8fdb\u884c\u6d4f\u89c8\u8fd9\u4e2a\u793a\u4f8b\u7b14\u8bb0\u672c\u3002<\/p>\n<p>&nbsp;<\/p>\n<h1>Llama2\u670d\u52a1\u7684\u4f18\u5316\u793a\u4f8b<\/h1>\n<p>\u901a\u8fc7\u6700\u4f18\u5316LLM\u4fdd\u5b58\uff0c\u60a8\u53ef\u4ee5\u5c06Databricks\u6a21\u578b\u670d\u52a1\u90e8\u7f72\u5230\u5177\u6709\u81ea\u52a8\u4f18\u5316\u529f\u80fd\u7684\u6700\u65b0OSS LLM\u548cGPU\uff0c\u4ee5\u63d0\u4f9b\u6539\u8fdb\u7684\u5ef6\u8fdf\u548c\u541e\u5410\u91cf\u3002\u76ee\u524d\uff0c\u6211\u4eec\u652f\u6301Llama2\u548cMosaic MPT\u7c7b\u6a21\u578b\u7684\u4f18\u5316\u3002<\/p>\n<p>\u5728\u8fd9\u4e2a\u793a\u4f8b\u4e2d\uff0c\u6211\u4eec\u5c06\u6f14\u793a\u4ee5\u4e0b\u5185\u5bb9:<\/p>\n<ol>\n<li style=\"list-style-type: none;\">\n<ol>\u4eceHugging Face transformers\u4e0b\u8f7d\u6a21\u578b<\/ol>\n<\/li>\n<\/ol>\n<p>&nbsp;<\/p>\n<ol>\n<li style=\"list-style-type: none;\">\n<ol>\u5c06\u6a21\u578b\u8bb0\u5f55\u5728Databricks\u7684Unity Catalog\u6216Workspace 
Registry\u4e2d\uff0c\u4ee5\u4f18\u5316\u7684serving\u652f\u6301\u683c\u5f0f<\/ol>\n<\/li>\n<\/ol>\n<p>&nbsp;<\/p>\n<ol>\u542f\u7528\u6a21\u578b\u7684\u4f18\u5316serving\u3002<\/ol>\n<h2>\u524d\u7f6e\u6761\u4ef6<\/h2>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">\u30ce\u30fc\u30c8\u30d6\u30c3\u30af\u3092\u5341\u5206\u306a\u30e1\u30e2\u30ea\u30fc\u3092\u6301\u3064\u30af\u30e9\u30b9\u30bf\u30fc\u306b\u30a2\u30bf\u30c3\u30c1<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">MLflow\u30d0\u30fc\u30b8\u30e7\u30f32.7.0\u4ee5\u964d\u304c\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3055\u308c\u3066\u3044\u308b\u3053\u3068<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">7B\u4ee5\u4e0a\u306e\u30b5\u30a4\u30ba\u306e\u30e2\u30c7\u30eb\u3092\u53d6\u308a\u6271\u3046\u969b\u306b\u306f\u7279\u306bUC\u3067\u306e\u30e2\u30c7\u30eb\u7ba1\u7406\u3092\u884c\u3046\u3053\u3068<\/ul>\n<h1>\u6b65\u9aa41\uff1a\u4e3a\u4e86\u4f18\u5316LLM\u5b58\u50a8\uff0c\u8bb0\u5f55\u6a21\u578b\u3002<\/h1>\n<pre class=\"post-pre\"><code><span class=\"c1\"># \u5fc5\u8981\u306a\u4f9d\u5b58\u95a2\u4fc2\u3092\u66f4\u65b0\/\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\r\n<\/span><span class=\"err\">!<\/span><span class=\"n\">pip<\/span> <span class=\"n\">install<\/span> <span class=\"o\">-<\/span><span class=\"n\">U<\/span> <span class=\"n\">mlflow<\/span>\r\n<span class=\"err\">!<\/span><span class=\"n\">pip<\/span> <span class=\"n\">install<\/span> <span class=\"o\">-<\/span><span class=\"n\">U<\/span> <span class=\"n\">transformers<\/span>\r\n<span class=\"err\">!<\/span><span class=\"n\">pip<\/span> <span class=\"n\">install<\/span> <span class=\"o\">-<\/span><span class=\"n\">U<\/span> <span class=\"n\">accelerate<\/span>\r\n<span class=\"err\">!<\/span><span class=\"n\">pip<\/span> <span class=\"n\">install<\/span> <span class=\"o\">-<\/span><span class=\"n\">U<\/span> <span 
class=\"n\">flash_attn<\/span> <span class=\"c1\"># DBR 13.3 ML\u3067\u30a8\u30e9\u30fc\u306b\u306a\u3063\u305f\u306e\u3067\u8ffd\u52a0\r\n<\/span><span class=\"n\">dbutils<\/span><span class=\"p\">.<\/span><span class=\"n\">library<\/span><span class=\"p\">.<\/span><span class=\"nf\">restartPython<\/span><span class=\"p\">()<\/span>\r\n<\/code><\/pre>\n<p>\u8f93\u5165 Hugging Face \u7684\u4ee4\u724c\u3002\u66f4\u591a\u8be6\u60c5\u8bf7\u70b9\u51fb\u6b64\u5904\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"kn\">import<\/span> <span class=\"n\">huggingface_hub<\/span>\r\n<span class=\"c1\"># \u65e2\u306bhugging face\u306b\u30ed\u30b0\u30a4\u30f3\u3057\u3066\u3044\u308b\u969b\u306b\u306f\u30b9\u30ad\u30c3\u30d7\r\n<\/span><span class=\"n\">huggingface_hub<\/span><span class=\"p\">.<\/span><span class=\"nf\">login<\/span><span class=\"p\">()<\/span>\r\n<\/code><\/pre>\n<pre class=\"post-pre\"><code><span class=\"kn\">from<\/span> <span class=\"n\">transformers<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">AutoModelForCausalLM<\/span><span class=\"p\">,<\/span> <span class=\"n\">AutoTokenizer<\/span>\r\n<span class=\"kn\">import<\/span> <span class=\"n\">torch<\/span>\r\n\r\n<span class=\"n\">model<\/span> <span class=\"o\">=<\/span> <span class=\"n\">AutoModelForCausalLM<\/span><span class=\"p\">.<\/span><span class=\"nf\">from_pretrained<\/span><span class=\"p\">(<\/span>\r\n    <span class=\"sh\">\"<\/span><span class=\"s\">meta-llama\/Llama-2-7b-chat-hf<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> \r\n    <span class=\"n\">torch_dtype<\/span><span class=\"o\">=<\/span><span class=\"n\">torch<\/span><span class=\"p\">.<\/span><span class=\"n\">bfloat16<\/span>\r\n<span class=\"p\">)<\/span>\r\n<span class=\"n\">tokenizer<\/span> <span class=\"o\">=<\/span> <span class=\"n\">AutoTokenizer<\/span><span class=\"p\">.<\/span><span class=\"nf\">from_pretrained<\/span><span class=\"p\">(<\/span>\r\n    <span 
class=\"sh\">\"<\/span><span class=\"s\">meta-llama\/Llama-2-7b-chat-hf<\/span><span class=\"sh\">\"<\/span>\r\n<span class=\"p\">)<\/span>\r\n<\/code><\/pre>\n<pre class=\"post-pre\"><code><span class=\"kn\">import<\/span> <span class=\"n\">mlflow<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"n\">mlflow.models.signature<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">ModelSignature<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"n\">mlflow.types.schema<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">ColSpec<\/span><span class=\"p\">,<\/span> <span class=\"n\">Schema<\/span>\r\n<span class=\"kn\">import<\/span> <span class=\"n\">numpy<\/span> <span class=\"k\">as<\/span> <span class=\"n\">np<\/span>\r\n\r\n<span class=\"c1\"># \u30e2\u30c7\u30eb\u306e\u5165\u51fa\u529b\u30b9\u30ad\u30fc\u30de\u306e\u5b9a\u7fa9\r\n<\/span><span class=\"n\">input_schema<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">Schema<\/span><span class=\"p\">([<\/span>\r\n    <span class=\"nc\">ColSpec<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">string<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">prompt<\/span><span class=\"sh\">\"<\/span><span class=\"p\">),<\/span>\r\n    <span class=\"nc\">ColSpec<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">double<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">temperature<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">optional<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">),<\/span>\r\n    <span class=\"nc\">ColSpec<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">integer<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">max_tokens<\/span><span 
class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">optional<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">),<\/span>\r\n    <span class=\"nc\">ColSpec<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">string<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">stop<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">optional<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">),<\/span>\r\n    <span class=\"nc\">ColSpec<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">integer<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">candidate_count<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">optional<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">)<\/span>\r\n<span class=\"p\">])<\/span>\r\n\r\n<span class=\"n\">output_schema<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">Schema<\/span><span class=\"p\">([<\/span>\r\n    <span class=\"nc\">ColSpec<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">string<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span> <span class=\"sh\">'<\/span><span class=\"s\">predictions<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\r\n<span class=\"p\">])<\/span>\r\n\r\n<span class=\"n\">signature<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">ModelSignature<\/span><span class=\"p\">(<\/span><span class=\"n\">inputs<\/span><span class=\"o\">=<\/span><span class=\"n\">input_schema<\/span><span class=\"p\">,<\/span> <span class=\"n\">outputs<\/span><span class=\"o\">=<\/span><span class=\"n\">output_schema<\/span><span class=\"p\">)<\/span>\r\n\r\n<span class=\"c1\"># 
\u5165\u529b\u30b5\u30f3\u30d7\u30eb\u306e\u5b9a\u7fa9\r\n<\/span><span class=\"n\">input_example<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span>\r\n    <span class=\"sh\">\"<\/span><span class=\"s\">prompt<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">np<\/span><span class=\"p\">.<\/span><span class=\"nf\">array<\/span><span class=\"p\">([<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">Below is an instruction that describes a task. <\/span><span class=\"sh\">\"<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">Write a response that appropriately completes the request.<\/span><span class=\"se\">\\n\\n<\/span><span class=\"sh\">\"<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">### Instruction:<\/span><span class=\"se\">\\n<\/span><span class=\"sh\">\"<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">What is Apache Spark?<\/span><span class=\"se\">\\n\\n<\/span><span class=\"sh\">\"<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">### Response:<\/span><span class=\"se\">\\n<\/span><span class=\"sh\">\"<\/span>\r\n    <span class=\"p\">])<\/span>\r\n<span class=\"p\">}<\/span>\r\n<\/code><\/pre>\n<p>\u8981\u542f\u7528\u6700\u4f18\u5316\u670d\u52a1\uff0c\u60a8\u9700\u8981\u5728\u8bb0\u5f55\u6a21\u578b\u65f6\u8c03\u7528mlflow.transformers.log_model\uff0c\u5e76\u5305\u542b\u4ee5\u4e0b\u65b9\u5f0f\u7684\u5b57\u5178\u4f5c\u4e3a\u9644\u52a0\u7684\u5143\u6570\u636e:<\/p>\n<pre class=\"post-pre\"><code>metadata = {\"task\": \"llm\/v1\/completions\"}\r\n<\/code><\/pre>\n<p>\u5728\u8fd9\u91cc\uff0c\u6211\u4eec\u6307\u5b9a\u4e86\u7528\u4e8e\u6a21\u578b\u670d\u52a1\u7aef\u70b9\u7684API\u7b7e\u540d\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"kn\">import<\/span> <span class=\"n\">mlflow<\/span>\r\n\r\n<span class=\"c1\"># 
UC\u3067\u306e\u30e2\u30c7\u30eb\u7ba1\u7406\u3092\u884c\u308f\u306a\u3044\u5834\u5408\u306b\u306f\u4ee5\u4e0b\u306e\u884c\u3092\u30b3\u30e1\u30f3\u30c8\u30a2\u30a6\u30c8\u3057\u307e\u3059\r\n# 3\u30ec\u30d9\u30eb\u306e\u540d\u524d\u7a7a\u9593\u3067\u306f\u306a\u304f\u3001\u30b7\u30f3\u30d7\u30eb\u306b\u30e2\u30c7\u30eb\u540d\u3092\u6307\u5b9a\u3057\u307e\u3059\r\n<\/span><span class=\"n\">mlflow<\/span><span class=\"p\">.<\/span><span class=\"nf\">set_registry_uri<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">databricks-uc<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\r\n<span class=\"n\">CATALOG<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">quickstart_catalog_taka<\/span><span class=\"sh\">\"<\/span>\r\n<span class=\"n\">SCHEMA<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">llm-catalog<\/span><span class=\"sh\">\"<\/span>\r\n<span class=\"n\">registered_model_name<\/span> <span class=\"o\">=<\/span> <span class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span class=\"si\">{<\/span><span class=\"n\">CATALOG<\/span><span class=\"si\">}<\/span><span class=\"s\">.<\/span><span class=\"si\">{<\/span><span class=\"n\">SCHEMA<\/span><span class=\"si\">}<\/span><span class=\"s\">.llama2-7b<\/span><span class=\"sh\">\"<\/span>\r\n\r\n<span class=\"c1\"># \u65b0\u898fMLflow\u30e9\u30f3\u3092\u30b9\u30bf\u30fc\u30c8\r\n<\/span><span class=\"k\">with<\/span> <span class=\"n\">mlflow<\/span><span class=\"p\">.<\/span><span class=\"nf\">start_run<\/span><span class=\"p\">():<\/span>\r\n    <span class=\"n\">components<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">model<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">model<\/span><span class=\"p\">,<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">tokenizer<\/span><span 
class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">tokenizer<\/span><span class=\"p\">,<\/span>\r\n    <span class=\"p\">}<\/span>\r\n    <span class=\"n\">mlflow<\/span><span class=\"p\">.<\/span><span class=\"n\">transformers<\/span><span class=\"p\">.<\/span><span class=\"nf\">log_model<\/span><span class=\"p\">(<\/span>\r\n        <span class=\"n\">transformers_model<\/span><span class=\"o\">=<\/span><span class=\"n\">components<\/span><span class=\"p\">,<\/span>\r\n        <span class=\"n\">task<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">text-generation<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\r\n        <span class=\"n\">artifact_path<\/span><span class=\"o\">=<\/span><span class=\"sh\">\"<\/span><span class=\"s\">model<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\r\n        <span class=\"n\">registered_model_name<\/span><span class=\"o\">=<\/span><span class=\"n\">registered_model_name<\/span><span class=\"p\">,<\/span>\r\n        <span class=\"n\">signature<\/span><span class=\"o\">=<\/span><span class=\"n\">signature<\/span><span class=\"p\">,<\/span>\r\n        <span class=\"n\">input_example<\/span><span class=\"o\">=<\/span><span class=\"n\">input_example<\/span><span class=\"p\">,<\/span>\r\n        <span class=\"n\">metadata<\/span><span class=\"o\">=<\/span><span class=\"p\">{<\/span><span class=\"sh\">\"<\/span><span class=\"s\">task<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">llm\/v1\/completions<\/span><span class=\"sh\">\"<\/span><span class=\"p\">}<\/span>\r\n    <span class=\"p\">)<\/span>\r\n<\/code><\/pre>\n<div><img decoding=\"async\" class=\"post-images\" title=\"\" src=\"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d9158913a08637a6df366\/18-0.png\" alt=\"Screenshot 2023-10-08 at 17.12.08.png\" \/><\/div>\n<div><img decoding=\"async\" class=\"post-images\" title=\"\" 
src=\"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d9158913a08637a6df366\/19-0.png\" alt=\"Screenshot 2023-10-08 at 17.11.42.png\" \/><\/div>\n<h1>\u6b65\u9aa42\uff1a\u8bbe\u7f6e\u548c\u521b\u5efa\u6a21\u578b\u4fdd\u5b58\u7684GPU\u7aef\u70b9\u3002<\/h1>\n<p>\u8981\u66f4\u6539\u7ec8\u7aef\u8282\u70b9\u540d\uff0c\u8bf7\u4fee\u6539\u4ee5\u4e0b\u5355\u5143\u683c\u3002\u8c03\u7528\u7ec8\u7aef\u8282\u70b9API\u4e4b\u540e\uff0c\u8bb0\u5f55\u7684Llama2\u6a21\u578b\u5c06\u81ea\u52a8\u90e8\u7f72\u5230\u4f18\u5316\u7684LLM\u670d\u52a1\u4e2d\u3002workload_type\u9700\u8981\u6307\u5b9a\u73af\u5883\u4e2d\u53ef\u7528\u89c4\u683c\u7684GPU\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"c1\"># MLflow\u30a8\u30f3\u30c9\u30dd\u30a4\u30f3\u30c8\u540d\u306e\u8a2d\u5b9a\r\n<\/span><span class=\"n\">endpoint_name<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">taka-llama2-7b<\/span><span class=\"sh\">\"<\/span>\r\n\r\n<span class=\"c1\"># \u767b\u9332\u3055\u308c\u305fMLflow\u30e2\u30c7\u30eb\u540d\r\n<\/span><span class=\"n\">model_name<\/span> <span class=\"o\">=<\/span> <span class=\"n\">registered_model_name<\/span>\r\n\r\n<span class=\"c1\"># MLflow\u30e2\u30c7\u30eb\u306e\u6700\u65b0\u30d0\u30fc\u30b8\u30e7\u30f3\u306e\u53d6\u5f97\r\n<\/span><span class=\"n\">model_version<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">1<\/span>\r\n\r\n<span class=\"c1\"># \u8a08\u7b97\u8cc7\u6e90\u30bf\u30a4\u30d7\u306e\u6307\u5b9a (CPU, GPU_SMALL, GPU_MEDIUM, etc.)\r\n<\/span><span class=\"n\">workload_type<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">GPU_MEDIUM<\/span><span class=\"sh\">\"<\/span>\r\n\r\n<span class=\"c1\"># \u8a08\u7b97\u8cc7\u6e90\u306e\u30b9\u30b1\u30fc\u30eb\u30a2\u30a6\u30c8\u30b5\u30a4\u30ba\u306e\u6307\u5b9a (Small, Medium, Large, etc.)\r\n<\/span><span class=\"n\">workload_size<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">Small<\/span><span 
class=\"sh\">\"<\/span> \r\n\r\n<span class=\"c1\"># \u30bc\u30ed\u3078\u306e\u30b9\u30b1\u30fc\u30eb\u306e\u6307\u5b9a (CPU\u30a8\u30f3\u30c9\u30dd\u30a4\u30f3\u30c8\u3067\u306e\u307f\u30b5\u30dd\u30fc\u30c8)\r\n<\/span><span class=\"n\">scale_to_zero<\/span> <span class=\"o\">=<\/span> <span class=\"bp\">False<\/span> \r\n\r\n<span class=\"c1\"># \u73fe\u5728\u306e\u30ce\u30fc\u30c8\u30d6\u30c3\u30af\u30b3\u30f3\u30c6\u30ad\u30b9\u30c8\u304b\u3089API\u30a8\u30f3\u30c9\u30dd\u30a4\u30f3\u30c8\u3068\u30c8\u30fc\u30af\u30f3\u3092\u53d6\u5f97\r\n<\/span><span class=\"n\">API_ROOT<\/span> <span class=\"o\">=<\/span> <span class=\"n\">dbutils<\/span><span class=\"p\">.<\/span><span class=\"n\">notebook<\/span><span class=\"p\">.<\/span><span class=\"n\">entry_point<\/span><span class=\"p\">.<\/span><span class=\"nf\">getDbutils<\/span><span class=\"p\">().<\/span><span class=\"nf\">notebook<\/span><span class=\"p\">().<\/span><span class=\"nf\">getContext<\/span><span class=\"p\">().<\/span><span class=\"nf\">apiUrl<\/span><span class=\"p\">().<\/span><span class=\"nf\">get<\/span><span class=\"p\">()<\/span> \r\n<span class=\"n\">API_TOKEN<\/span> <span class=\"o\">=<\/span> <span class=\"n\">dbutils<\/span><span class=\"p\">.<\/span><span class=\"n\">notebook<\/span><span class=\"p\">.<\/span><span class=\"n\">entry_point<\/span><span class=\"p\">.<\/span><span class=\"nf\">getDbutils<\/span><span class=\"p\">().<\/span><span class=\"nf\">notebook<\/span><span class=\"p\">().<\/span><span class=\"nf\">getContext<\/span><span class=\"p\">().<\/span><span class=\"nf\">apiToken<\/span><span class=\"p\">().<\/span><span class=\"nf\">get<\/span><span class=\"p\">()<\/span>\r\n<\/code><\/pre>\n<pre class=\"post-pre\"><code><span class=\"kn\">import<\/span> <span class=\"n\">requests<\/span>\r\n<span class=\"kn\">import<\/span> <span class=\"n\">json<\/span>\r\n\r\n<span class=\"n\">data<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span>\r\n    <span 
class=\"sh\">\"<\/span><span class=\"s\">name<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">endpoint_name<\/span><span class=\"p\">,<\/span>\r\n    <span class=\"sh\">\"<\/span><span class=\"s\">config<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">{<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">served_models<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">[<\/span>\r\n            <span class=\"p\">{<\/span>\r\n                <span class=\"sh\">\"<\/span><span class=\"s\">model_name<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">model_name<\/span><span class=\"p\">,<\/span>\r\n                <span class=\"sh\">\"<\/span><span class=\"s\">model_version<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">model_version<\/span><span class=\"p\">,<\/span>\r\n                <span class=\"sh\">\"<\/span><span class=\"s\">workload_size<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">workload_size<\/span><span class=\"p\">,<\/span>\r\n                <span class=\"sh\">\"<\/span><span class=\"s\">scale_to_zero_enabled<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">scale_to_zero<\/span><span class=\"p\">,<\/span>\r\n                <span class=\"sh\">\"<\/span><span class=\"s\">workload_type<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">workload_type<\/span><span class=\"p\">,<\/span>\r\n            <span class=\"p\">}<\/span>\r\n        <span class=\"p\">]<\/span>\r\n    <span class=\"p\">},<\/span>\r\n<span class=\"p\">}<\/span>\r\n\r\n<span class=\"n\">headers<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span><span class=\"sh\">\"<\/span><span class=\"s\">Context-Type<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span 
class=\"s\">text\/json<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">Authorization<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span class=\"s\">Bearer <\/span><span class=\"si\">{<\/span><span class=\"n\">API_TOKEN<\/span><span class=\"si\">}<\/span><span class=\"sh\">\"<\/span><span class=\"p\">}<\/span>\r\n\r\n<span class=\"n\">response<\/span> <span class=\"o\">=<\/span> <span class=\"n\">requests<\/span><span class=\"p\">.<\/span><span class=\"nf\">post<\/span><span class=\"p\">(<\/span><span class=\"n\">url<\/span><span class=\"o\">=<\/span><span class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span class=\"si\">{<\/span><span class=\"n\">API_ROOT<\/span><span class=\"si\">}<\/span><span class=\"s\">\/api\/2.0\/serving-endpoints<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">json<\/span><span class=\"o\">=<\/span><span class=\"n\">data<\/span><span class=\"p\">,<\/span> <span class=\"n\">headers<\/span><span class=\"o\">=<\/span><span class=\"n\">headers<\/span><span class=\"p\">)<\/span>\r\n\r\n<span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"nf\">dumps<\/span><span class=\"p\">(<\/span><span class=\"n\">response<\/span><span class=\"p\">.<\/span><span class=\"nf\">json<\/span><span class=\"p\">(),<\/span> <span class=\"n\">indent<\/span><span class=\"o\">=<\/span><span class=\"mi\">4<\/span><span class=\"p\">))<\/span>\r\n<\/code><\/pre>\n<h1>\u53c2\u8003\u7aef\u70b9<\/h1>\n<div><img decoding=\"async\" class=\"post-images\" title=\"\" src=\"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d9158913a08637a6df366\/25-0.png\" alt=\"Screenshot 2023-10-09 at 15.00.59.png\" 
\/><\/div>\n<h1>\u6b65\u9aa43\uff1a\u67e5\u8be2\u7aef\u70b9<\/h1>\n<p>\u5f53\u7aef\u70b9\u51c6\u5907\u597d\u540e\uff0c\u53ef\u4ee5\u901a\u8fc7API\u8bf7\u6c42\u8fdb\u884c\u67e5\u8be2\u3002\u51c6\u5907\u65f6\u95f4\u53d6\u51b3\u4e8e\u6a21\u578b\u7684\u5927\u5c0f\u548c\u590d\u6742\u6027\uff0c\u53ef\u80fd\u9700\u898130\u5206\u949f\u4ee5\u4e0a\u3002<\/p>\n<div>GPU Medium\u7684\u60c5\u51b5\u4e0b\uff0c\u5927\u7ea630\u5206\u949f\u5c31\u4f1a\u51c6\u5907\u597d\u3002<\/div>\n<pre class=\"post-pre\"><code><span class=\"n\">data<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span>\r\n    <span class=\"sh\">\"<\/span><span class=\"s\">inputs<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">{<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">prompt<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">[<\/span>\r\n            <span class=\"sh\">\"<\/span><span class=\"s\">Below is an instruction that describes a task. 
Write a response that appropriately completes the request.<\/span><span class=\"se\">\\n\\n<\/span><span class=\"s\">### Instruction:<\/span><span class=\"se\">\\n<\/span><span class=\"s\">What is Apache Spark?<\/span><span class=\"se\">\\n\\n<\/span><span class=\"s\">### Response:<\/span><span class=\"se\">\\n<\/span><span class=\"sh\">\"<\/span>\r\n        <span class=\"p\">]<\/span>\r\n    <span class=\"p\">},<\/span>\r\n    <span class=\"sh\">\"<\/span><span class=\"s\">params<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">{<\/span>\r\n        <span class=\"sh\">\"<\/span><span class=\"s\">max_tokens<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"mi\">100<\/span><span class=\"p\">,<\/span> \r\n        <span class=\"sh\">\"<\/span><span class=\"s\">temperature<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"mf\">0.0<\/span>\r\n    <span class=\"p\">}<\/span>\r\n<span class=\"p\">}<\/span>\r\n\r\n<span class=\"n\">headers<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span>\r\n    <span class=\"sh\">\"<\/span><span class=\"s\">Context-Type<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">text\/json<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\r\n    <span class=\"sh\">\"<\/span><span class=\"s\">Authorization<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span class=\"s\">Bearer <\/span><span class=\"si\">{<\/span><span class=\"n\">API_TOKEN<\/span><span class=\"si\">}<\/span><span class=\"sh\">\"<\/span>\r\n<span class=\"p\">}<\/span>\r\n\r\n<span class=\"n\">response<\/span> <span class=\"o\">=<\/span> <span class=\"n\">requests<\/span><span class=\"p\">.<\/span><span class=\"nf\">post<\/span><span class=\"p\">(<\/span>\r\n    <span class=\"n\">url<\/span><span class=\"o\">=<\/span><span 
class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span class=\"si\">{<\/span><span class=\"n\">API_ROOT<\/span><span class=\"si\">}<\/span><span class=\"s\">\/serving-endpoints\/<\/span><span class=\"si\">{<\/span><span class=\"n\">endpoint_name<\/span><span class=\"si\">}<\/span><span class=\"s\">\/invocations<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\r\n    <span class=\"n\">json<\/span><span class=\"o\">=<\/span><span class=\"n\">data<\/span><span class=\"p\">,<\/span>\r\n    <span class=\"n\">headers<\/span><span class=\"o\">=<\/span><span class=\"n\">headers<\/span>\r\n<span class=\"p\">)<\/span>\r\n\r\n<span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"nf\">dumps<\/span><span class=\"p\">(<\/span><span class=\"n\">response<\/span><span class=\"p\">.<\/span><span class=\"nf\">json<\/span><span class=\"p\">(),<\/span> <span class=\"n\">indent<\/span><span class=\"o\">=<\/span><span class=\"mi\">4<\/span><span class=\"p\">))<\/span>\r\n<\/code><\/pre>\n<p>\u67e5\u8be2\u6210\u529f\uff01<\/p>\n<pre class=\"post-pre\"><code><span class=\"p\">{<\/span>\r\n    <span class=\"nl\">\"predictions\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">[<\/span>\r\n        <span class=\"p\">{<\/span>\r\n            <span class=\"nl\">\"candidates\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">[<\/span>\r\n                <span class=\"p\">{<\/span>\r\n                    <span class=\"nl\">\"text\"<\/span><span class=\"p\">:<\/span> <span class=\"s2\">\"Apache Spark is an open-source data processing engine that can handle large-scale data processing tasks. It was developed at the University of California, Berkeley and is now maintained by Apache Software Foundation. Spark provides high-level APIs in Java, Python, Scala, and R, and supports a wide range of data sources, including Hadoop Distributed File System (HDFS), Cassandra, HBase, and Hive. 
Spark's core features include in-memory computing, fault\"<\/span><span class=\"p\">,<\/span>\r\n                    <span class=\"nl\">\"metadata\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">{<\/span>\r\n                        <span class=\"nl\">\"finish_reason\"<\/span><span class=\"p\">:<\/span> <span class=\"s2\">\"length\"<\/span>\r\n                    <span class=\"p\">}<\/span>\r\n                <span class=\"p\">}<\/span>\r\n            <span class=\"p\">],<\/span>\r\n            <span class=\"nl\">\"metadata\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">{<\/span>\r\n                <span class=\"nl\">\"input_tokens\"<\/span><span class=\"p\">:<\/span> <span class=\"mi\">41<\/span><span class=\"p\">,<\/span>\r\n                <span class=\"nl\">\"output_tokens\"<\/span><span class=\"p\">:<\/span> <span class=\"mi\">100<\/span><span class=\"p\">,<\/span>\r\n                <span class=\"nl\">\"total_tokens\"<\/span><span class=\"p\">:<\/span> <span class=\"mi\">141<\/span>\r\n            <span class=\"p\">}<\/span>\r\n        <span class=\"p\">}<\/span>\r\n    <span class=\"p\">]<\/span>\r\n<span class=\"p\">}<\/span>\r\n<\/code><\/pre>\n<h3>Databricks\u5feb\u901f\u5165\u95e8\u6307\u5357<\/h3>\n<p>Databricks\u5feb\u901f\u5165\u95e8\u6307\u5357<\/p>\n<h3>Databricks\u514d\u8d39\u8bd5\u7528<\/h3>\n<p>Databricks\u514d\u8d39\u8bd5\u7528<\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u6211\u4f1a\u4e3a\u60a8\u8fdb\u884c\u6d4f\u89c8\u8fd9\u4e2a\u793a\u4f8b\u7b14\u8bb0\u672c\u3002 &nbsp; Llama2\u670d\u52a1\u7684\u4f18\u5316\u793a\u4f8b \u901a\u8fc7\u6700\u4f18\u5316LLM\u4fdd\u5b58\uff0c\u60a8\u53ef\u4ee5\u5c06Da 
[&hellip;]<\/p>\n","protected":false},"author":11,"featured_media":0,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[],"class_list":["post-50410","post","type-post","status-publish","format-standard","hentry","category-uncategorized"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v21.5 (Yoast SEO v21.5) - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b - Blog - Silicon Cloud<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.silicloud.com\/zh\/blog\/\u5c1d\u8bd5\u5728databricks\u7684llm\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72llama2\u6a21\u578b\u3002\/\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b\" \/>\n<meta property=\"og:description\" content=\"\u6211\u4f1a\u4e3a\u60a8\u8fdb\u884c\u6d4f\u89c8\u8fd9\u4e2a\u793a\u4f8b\u7b14\u8bb0\u672c\u3002 &nbsp; Llama2\u670d\u52a1\u7684\u4f18\u5316\u793a\u4f8b \u901a\u8fc7\u6700\u4f18\u5316LLM\u4fdd\u5b58\uff0c\u60a8\u53ef\u4ee5\u5c06Da [&hellip;]\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.silicloud.com\/zh\/blog\/\u5c1d\u8bd5\u5728databricks\u7684llm\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72llama2\u6a21\u578b\u3002\/\" \/>\n<meta property=\"og:site_name\" content=\"Blog - Silicon Cloud\" \/>\n<meta property=\"article:published_time\" content=\"2024-01-26T13:34:42+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2024-04-30T09:35:43+00:00\" \/>\n<meta property=\"og:image\" 
content=\"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d9158913a08637a6df366\/18-0.png\" \/>\n<meta name=\"author\" content=\"\u65b0, \u97f5\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"\u65b0, \u97f5\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"3 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/\",\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/\",\"name\":\"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b - Blog - Silicon 
Cloud\",\"isPartOf\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#website\"},\"datePublished\":\"2024-01-26T13:34:42+00:00\",\"dateModified\":\"2024-04-30T09:35:43+00:00\",\"author\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/4ba4019495123db3038fd0809e6959c9\"},\"breadcrumb\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/www.silicloud.com\/zh\/blog\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#website\",\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/\",\"name\":\"Blog - Silicon Cloud\",\"description\":\"\",\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/4ba4019495123db3038fd0809e6959c9\",\"name\":\"\u65b0, 
\u97f5\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/secure.gravatar.com\/avatar\/d484b6c6e4ae82e8a9efea989e1d2af46d9b6ef128101e63b18f559fca0ae627?s=96&d=mm&r=g\",\"contentUrl\":\"https:\/\/secure.gravatar.com\/avatar\/d484b6c6e4ae82e8a9efea989e1d2af46d9b6ef128101e63b18f559fca0ae627?s=96&d=mm&r=g\",\"caption\":\"\u65b0, \u97f5\"},\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/author\/yunxin\/\"},{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/#local-main-organization-logo\",\"url\":\"\",\"contentUrl\":\"\",\"caption\":\"Blog - Silicon Cloud\"}]}<\/script>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b - Blog - Silicon Cloud","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.silicloud.com\/zh\/blog\/\u5c1d\u8bd5\u5728databricks\u7684llm\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72llama2\u6a21\u578b\u3002\/","og_locale":"zh_CN","og_type":"article","og_title":"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b","og_description":"\u6211\u4f1a\u4e3a\u60a8\u8fdb\u884c\u6d4f\u89c8\u8fd9\u4e2a\u793a\u4f8b\u7b14\u8bb0\u672c\u3002 &nbsp; Llama2\u670d\u52a1\u7684\u4f18\u5316\u793a\u4f8b \u901a\u8fc7\u6700\u4f18\u5316LLM\u4fdd\u5b58\uff0c\u60a8\u53ef\u4ee5\u5c06Da 
[&hellip;]","og_url":"https:\/\/www.silicloud.com\/zh\/blog\/\u5c1d\u8bd5\u5728databricks\u7684llm\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72llama2\u6a21\u578b\u3002\/","og_site_name":"Blog - Silicon Cloud","article_published_time":"2024-01-26T13:34:42+00:00","article_modified_time":"2024-04-30T09:35:43+00:00","og_image":[{"url":"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d9158913a08637a6df366\/18-0.png"}],"author":"\u65b0, \u97f5","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"\u65b0, \u97f5","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"3 \u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/","url":"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/","name":"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b - Blog - Silicon 
Cloud","isPartOf":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/#website"},"datePublished":"2024-01-26T13:34:42+00:00","dateModified":"2024-04-30T09:35:43+00:00","author":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/4ba4019495123db3038fd0809e6959c9"},"breadcrumb":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/www.silicloud.com\/zh\/blog\/"},{"@type":"ListItem","position":2,"name":"\u5c1d\u8bd5\u5728Databricks\u7684LLM\u4f18\u5316\u6a21\u578b\u670d\u52a1\u4e2d\u90e8\u7f72Llama2\u6a21\u578b"}]},{"@type":"WebSite","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#website","url":"https:\/\/www.silicloud.com\/zh\/blog\/","name":"Blog - Silicon Cloud","description":"","inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/4ba4019495123db3038fd0809e6959c9","name":"\u65b0, 
\u97f5","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/image\/","url":"https:\/\/secure.gravatar.com\/avatar\/d484b6c6e4ae82e8a9efea989e1d2af46d9b6ef128101e63b18f559fca0ae627?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/d484b6c6e4ae82e8a9efea989e1d2af46d9b6ef128101e63b18f559fca0ae627?s=96&d=mm&r=g","caption":"\u65b0, \u97f5"},"url":"https:\/\/www.silicloud.com\/zh\/blog\/author\/yunxin\/"},{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e5%b0%9d%e8%af%95%e5%9c%a8databricks%e7%9a%84llm%e4%bc%98%e5%8c%96%e6%a8%a1%e5%9e%8b%e6%9c%8d%e5%8a%a1%e4%b8%ad%e9%83%a8%e7%bd%b2llama2%e6%a8%a1%e5%9e%8b%e3%80%82\/#local-main-organization-logo","url":"","contentUrl":"","caption":"Blog - Silicon Cloud"}]}},"_links":{"self":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/50410","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/users\/11"}],"replies":[{"embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/comments?post=50410"}],"version-history":[{"count":2,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/50410\/revisions"}],"predecessor-version":[{"id":93313,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/50410\/revisions\/93313"}],"wp:attachment":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/media?parent=50410"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/categories?post=50410"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/tags?post=50410"}],"curies":
[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}