mesolitica/chatgpt-malay-function-call
收藏马来语功能调用指令数据集
数据集概述
该数据集包含马来语的功能调用指令,原始数据来自 https://huggingface.co/datasets/glaiveai/glaive-function-calling-v2,感谢 https://github.com/aisyahrzk 和 https://github.com/KamarulAdha 找到最佳的提示来进化。数据集使用 ChatGPT3.5 生成,相关笔记本可在 https://github.com/mesolitica/malaysian-dataset/tree/master/chatbot/evol-function-call 找到。
数据文件
function-calls.jsonl:包含 179450 行,大小为 200 MB。function-calls-complex.jsonl:包含 24986 行,大小为 27.8 MB。
示例数据
示例1
json { "function_call": "{ "name": "get_news_headlines", "description": "Dapatkan tajuk berita terkini", "parameters": { "type": "object", "properties": { "country": { "type": "string", "description": "Negara untuk mendapatkan berita" } }, "required": [ "country" ] } }", "conversations": [ { "role": "user", "content": "Bolehkah anda memberitahu saya tajuk berita terkini untuk Amerika Syarikat?" }, { "role": "assistant", "content": "<functioncall> {"name": "get_news_headlines", "arguments": "{"country": "Amerika Syarikat"}"}" }, { "role": "user", "content": "Itu menarik. Bagaimana pula dengan berita di Perancis?" }, { "role": "assistant", "content": "<functioncall> {"name": "get_news_headlines", "arguments": "{"country": "Perancis"}"}" } ] }
示例2
json { "function_call": "{ "name": "generate_password", "description": "Menghasilkan kata laluan rawak dengan kriteria yang ditetapkan", "parameters": { "type": "object", "properties": { "length": { "type": "integer", "description": "Panjang kata laluan" }, "include_numbers": { "type": "boolean", "description": "Termasuk nombor dalam kata laluan" }, "include_special_characters": { "type": "boolean", "description": "Termasuk karakter-karakter istimewa dalam kata laluan" } }, "required": [ "length" ] } }", "conversations": [ { "role": "user", "content": "Saya mahu ia panjang 12 aksara dan ya, ia patut termasuk kedua-dua nombor dan karakter istimewa." }, { "role": "assistant", "content": "<functioncall> {"name": "generate_password", "arguments": "{"length": 12, "include_numbers": True, "include_special_characters": True}"}" } ] }
示例3
json { "function_call": "{"name": "GeneratePurchaseOrder","description":"Fungsi ini digunakan untuk menghasilkan pesanan pembelian. Ia menerima maklumat produk, kuantiti, harga dan alamat penghantaran. Setiap produk perlu disertakan dengan kuantiti yang dikehendaki.","parameters":{"type":"object","properties":{"products":{"type":"array","items":{"type":"object","properties":{"product_name":{"type":"string","description":"Nama produk yang dipesan."},"quantity":{"type":"integer","description":"Kuantiti produk yang dikehendaki."},"price":{"type":"number","description":"Harga bagi satu unit produk."}},"required":["product_name","quantity","price"]}},"delivery_address":{"type":"string","description":"Alamat lengkap untuk penghantaran."}},"required":["products","delivery_address"]}}", "conversations": [ { "role": "user", "content": "Saya ingin membuat pesanan pembelian. Produk yang saya perlukan ialah:
- T-shirt, kuantiti 5, harga 25.50
- Kasut sukan, kuantiti 2, harga 80.00 Alamat penghantaran: No. 123, Jalan Merdeka, 68000 Ampang." }, { "role": "assistant", "content": "<functioncall> {name: GeneratePurchaseOrder, arguments: {products: [{product_name: T-shirt, quantity: 5, price: 25.5}, {product_name: Kasut sukan, quantity: 2, price: 80.0}], delivery_address: No. 123, Jalan Merdeka, 68000 Ampang}}" } ] }



