{"cells":[{"cell_type":"markdown","metadata":{"id":"T9u-JTdTpMzM"},"source":["## Dataset"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"PQtPVQfKn7h-"},"outputs":[],"source":["from google.colab import data_table; data_table.enable_dataframe_formatter()\n","import numpy as np; np.random.seed(123)\n","import pandas as pd"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"oqsw1ni_sN_b"},"outputs":[],"source":["df = pd.read_json(\"https://raw.githubusercontent.com/sahil280114/codealpaca/master/data/code_alpaca_20k.json\")\n","\n","# Label every row with a `split` id:\n","# 0 -> train set (90% of the rows)\n","# 1 -> validation set (5% of the rows)\n","# 2 -> test set (whatever remains, roughly 5%)\n","total_rows = len(df)\n","split_0_count = int(total_rows * 0.9)\n","split_1_count = int(total_rows * 0.05)\n","split_2_count = total_rows - (split_0_count + split_1_count)\n","\n","# Lay the labels out in three contiguous runs, then permute them in place;\n","# the permutation is driven by NumPy's global random state.\n","split_values = np.repeat([0, 1, 2], [split_0_count, split_1_count, split_2_count])\n","np.random.shuffle(split_values)\n","\n","# Attach the labels as an integer column and keep only the first 1000 rows\n","df = df.assign(split=split_values.astype(int)).head(n=1000)"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":618},"executionInfo":{"elapsed":5,"status":"ok","timestamp":1703888311059,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"},"user_tz":480},"id":"tgdeMSpEobGr","outputId":"b2a5cc10-ef79-40ee-a474-50e2cc48e00e"},"outputs":[{"output_type":"execute_result","data":{"text/plain":[" instruction \\\n","0 Create an array of length 5 which contains all... \n","1 Formulate an equation to calculate the height ... \n","2 Write a replace method for a string class whic... 
\n","3 Create an array of length 15 containing number... \n","4 Write a function to find the number of distinc... \n","5 Create a nested loop to print every combinatio... \n","6 Write a function to find the maximum differenc... \n","7 Write a function to generate the nth Fibonacci... \n","8 Write a class to represent a 2D point with x a... \n","9 Write code that removes spaces from a given st... \n","\n"," input \\\n","0 \n","1 \n","2 string = \"Hello World!\"\\nreplace_with = \"Greet... \n","3 \n","4 matrix = [[1, 0, 0],\\n [1, 0, 1],\\n ... \n","5 \n","6 arr = [5, 3, 17, 11, 9] \n","7 < noinput > \n","8 \n","9 string = \" A B C D \" \n","\n"," output split \n","0 arr = [2, 4, 6, 8, 10] 0 \n","1 Height of triangle = opposite side length * si... 0 \n","2 def replace(self, replace_with):\\n new_stri... 0 \n","3 arr = [3, 6, 9, 12, 15, 18, 21, 24, 27, 30, 33... 0 \n","4 def find_num_distinct_states(matrix):\\n sta... 0 \n","5 for i in range(10):\\n for j in range(10):\\n... 0 \n","6 def max_difference(arr):\\n max_diff = 0\\n ... 0 \n","7 def fib(n):\\n if n == 0:\\n return 0\\... 0 \n","8 class Point:\\n def __init__(self, x, y):\\n ... 0 \n","9 def remove_spaces(string): \\n return \"\".joi... 0 "],"text/html":["\n","
\n","
\n","\n","\n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n","
instructioninputoutputsplit
0Create an array of length 5 which contains all...arr = [2, 4, 6, 8, 10]0
1Formulate an equation to calculate the height ...Height of triangle = opposite side length * si...0
2Write a replace method for a string class whic...string = \"Hello World!\"\\nreplace_with = \"Greet...def replace(self, replace_with):\\n new_stri...0
3Create an array of length 15 containing number...arr = [3, 6, 9, 12, 15, 18, 21, 24, 27, 30, 33...0
4Write a function to find the number of distinc...matrix = [[1, 0, 0],\\n [1, 0, 1],\\n ...def find_num_distinct_states(matrix):\\n sta...0
5Create a nested loop to print every combinatio...for i in range(10):\\n for j in range(10):\\n...0
6Write a function to find the maximum differenc...arr = [5, 3, 17, 11, 9]def max_difference(arr):\\n max_diff = 0\\n ...0
7Write a function to generate the nth Fibonacci...< noinput >def fib(n):\\n if n == 0:\\n return 0\\...0
8Write a class to represent a 2D point with x a...class Point:\\n def __init__(self, x, y):\\n ...0
9Write code that removes spaces from a given st...string = \" A B C D \"def remove_spaces(string): \\n return \"\".joi...0
\n","
\n","
\n","\n","
\n"," \n","\n"," \n","\n"," \n","
\n","\n","\n","
\n"," \n","\n","\n","\n"," \n","
\n","
\n","
\n"],"application/vnd.google.colaboratory.module+javascript":"\n import \"https://ssl.gstatic.com/colaboratory/data_table/881c4a0d49046431/data_table.js\";\n\n const table = window.createDataTable({\n data: [[{\n 'v': 0,\n 'f': \"0\",\n },\n\"Create an array of length 5 which contains all even numbers between 1 and 10.\",\n\"\",\n\"arr = [2, 4, 6, 8, 10]\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 1,\n 'f': \"1\",\n },\n\"Formulate an equation to calculate the height of a triangle given the angle, side lengths and opposite side length.\",\n\"\",\n\"Height of triangle = opposite side length * sin (angle) / side length\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 2,\n 'f': \"2\",\n },\n\"Write a replace method for a string class which replaces the given string with a given set of characters.\",\n\"string = \\\"Hello World!\\\"\\nreplace_with = \\\"Greetings!\\\"\",\n\"def replace(self, replace_with):\\n new_string = \\\"\\\"\\n for char in self:\\n if char == \\\" \\\":\\n new_string += replace_with\\n else:\\n new_string += char\\n return new_string\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 3,\n 'f': \"3\",\n },\n\"Create an array of length 15 containing numbers divisible by 3 up to 45.\",\n\"\",\n\"arr = [3, 6, 9, 12, 15, 18, 21, 24, 27, 30, 33, 36, 39, 42, 45]\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 4,\n 'f': \"4\",\n },\n\"Write a function to find the number of distinct states in a given matrix.\",\n\"matrix = [[1, 0, 0],\\n [1, 0, 1],\\n [1, 1, 1]]\",\n\"def find_num_distinct_states(matrix):\\n states = set()\\n for row in matrix:\\n state = \\\"\\\".join([str(x) for x in row])\\n states.add(state)\\n return len(states)\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 5,\n 'f': \"5\",\n },\n\"Create a nested loop to print every combination of numbers between 0-9\",\n\"\",\n\"for i in range(10):\\n for j in range(10):\\n print(i, j)\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 6,\n 'f': \"6\",\n },\n\"Write a function to find the maximum 
difference between two numbers in a given array.\",\n\"arr = [5, 3, 17, 11, 9]\",\n\"def max_difference(arr):\\n max_diff = 0\\n for i in range(len(arr)-1):\\n diff = arr[i+1] - arr[i]\\n if diff > max_diff:\\n max_diff = diff\\n return max_diff\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 7,\n 'f': \"7\",\n },\n\"Write a function to generate the nth Fibonacci number.\",\n\"< noinput >\",\n\"def fib(n):\\n if n == 0:\\n return 0\\n elif n == 1:\\n return 1\\n else:\\n return fib(n-2) + fib(n-1)\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 8,\n 'f': \"8\",\n },\n\"Write a class to represent a 2D point with x and y coordinates.\",\n\"\",\n\"class Point:\\n def __init__(self, x, y):\\n self.x = x \\n self.y = y \\n \\n def __str__(self): \\n return \\\"({0},{1})\\\".format(self.x, self.y)\",\n{\n 'v': 0,\n 'f': \"0\",\n }],\n [{\n 'v': 9,\n 'f': \"9\",\n },\n\"Write code that removes spaces from a given string.\",\n\"string = \\\" A B C D \\\"\",\n\"def remove_spaces(string): \\n return \\\"\\\".join(string.split())\",\n{\n 'v': 0,\n 'f': \"0\",\n }]],\n columns: [[\"number\", \"index\"], [\"string\", \"instruction\"], [\"string\", \"input\"], [\"string\", \"output\"], [\"number\", \"split\"]],\n columnOptions: [{\"width\": \"1px\", \"className\": \"index_column\"}],\n rowsPerPage: 25,\n helpUrl: \"https://colab.research.google.com/notebooks/data_table.ipynb\",\n suppressOutputScrolling: true,\n minimumWidth: undefined,\n });\n\n function appendQuickchartButton(parentElement) {\n let quickchartButtonContainerElement = document.createElement('div');\n quickchartButtonContainerElement.innerHTML = `\n
\n \n \n\n\n \n
`;\n parentElement.appendChild(quickchartButtonContainerElement);\n }\n\n appendQuickchartButton(table);\n "},"metadata":{},"execution_count":7}],"source":["df.head(10)"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":2,"status":"ok","timestamp":1703888312308,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"},"user_tz":480},"id":"LS0qhGCvoi3a","outputId":"4b775dcc-1ece-414e-e03b-780687ef7812"},"outputs":[{"output_type":"stream","name":"stdout","text":["Total number of examples in the dataset: 1000\n","47.2% of examples that are self-sufficient\n","52.8% of examples that are need additional context\n"]}],"source":["# Some rows carry a \"< noinput >\" placeholder instead of an empty string;\n","# treat blank and placeholder inputs alike so both count as self-sufficient.\n","has_no_input = df['input'].fillna('').str.fullmatch(r'\\s*(?:<\\s*noinput\\s*>)?\\s*', case=False)\n","num_self_sufficient = has_no_input.sum()\n","num_need_context = df.shape[0] - num_self_sufficient\n","\n","print(f\"Total number of examples in the dataset: {df.shape[0]}\")\n","\n","print(f\"{round(num_self_sufficient/df.shape[0] * 100, 2)}% of examples that are self-sufficient\")\n","print(f\"{round(num_need_context/df.shape[0] * 100, 2)}% of examples that are need additional context\")"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":523},"executionInfo":{"elapsed":799,"status":"ok","timestamp":1703888314371,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"},"user_tz":480},"id":"TjjSCoZIpB8i","outputId":"6fcdfc0f-0359-4976-a4ea-b5e865d79a20"},"outputs":[{"output_type":"stream","name":"stdout","text":["Average number of tokens in the instruction column: 23\n","Average number of tokens in the input column: 8\n","Average number of tokens in the output column: 65\n","\n"]},{"output_type":"display_data","data":{"text/plain":["
"],"image/png":"\n"},"metadata":{}}],"source":["# Character length of every cell in the three text columns\n","df['num_characters_instruction'] = df['instruction'].str.len()\n","df['num_characters_input'] = df['input'].str.len()\n","df['num_characters_output'] = df['output'].str.len()\n","\n","# Show Distribution\n","df.hist(column=['num_characters_instruction', 'num_characters_input', 'num_characters_output'])\n","\n","# Calculating the average\n","average_chars_instruction = df['num_characters_instruction'].mean()\n","average_chars_input = df['num_characters_input'].mean()\n","average_chars_output = df['num_characters_output'].mean()\n","\n","# Token counts below are only an estimate: no tokenizer is run, the character\n","# averages are simply divided by an assumed number of characters per token.\n","CHARS_PER_TOKEN = 3\n","print(f'Average number of tokens in the instruction column: {(average_chars_instruction / CHARS_PER_TOKEN):.0f}')\n","print(f'Average number of tokens in the input column: {(average_chars_input / CHARS_PER_TOKEN):.0f}')\n","print(f'Average number of tokens in the output column: {(average_chars_output / CHARS_PER_TOKEN):.0f}', end=\"\\n\\n\")"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":322,"status":"ok","timestamp":1703808189674,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"},"user_tz":480},"id":"-mpSiGGHrWme","outputId":"bc66852a-cedc-4db7-ea71-40b0860a082d"},"outputs":[{"data":{"text/plain":["(898, 3)"]},"execution_count":16,"metadata":{},"output_type":"execute_result"}],"source":["df[df['split'] == 0][['instruction', 'input',\t'output']].shape"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"KRjyPoE_sRBU"},"outputs":[],"source":["json_result = df[df['split'] == 0][['instruction', 'input',\t'output']].to_json(orient='records')"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"UAOgoitzsrxn"},"outputs":[],"source":["with open('training_data.json', 'w') as file:\n"," 
file.write(json_result)"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":406,"status":"ok","timestamp":1703808214266,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"},"user_tz":480},"id":"zuccYgJjsyot","outputId":"907c1d0a-e99c-45d3-b917-135e26858e53"},"outputs":[{"name":"stdout","output_type":"stream","text":["config.json data.json\tmulti-lora-fine-tune sample_data training_data.json\n"]}],"source":["!ls"]},{"cell_type":"markdown","metadata":{"id":"dEKoBKrzqJhu"},"source":["## Fine-tune"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":5881,"status":"ok","timestamp":1703887815985,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"},"user_tz":480},"id":"6erZ2lsyqDpn","outputId":"a5d7c818-2053-4550-d192-d72ea3a6cb79"},"outputs":[{"output_type":"stream","name":"stdout","text":["Cloning into 'multi-lora-fine-tune'...\n","remote: Enumerating objects: 1034, done.\u001b[K\n","remote: Counting objects: 100% (453/453), done.\u001b[K\n","remote: Compressing objects: 100% (161/161), done.\u001b[K\n","remote: Total 1034 (delta 323), reused 331 (delta 289), pack-reused 581\u001b[K\n","Receiving objects: 100% (1034/1034), 6.33 MiB | 1.34 MiB/s, done.\n","Resolving deltas: 100% (573/573), done.\n"]}],"source":["# Skip the clone when the checkout already exists so this cell can be re-run\n","![ -d multi-lora-fine-tune ] || git clone https://github.com/TUDB-Labs/multi-lora-fine-tune.git"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"yJQw3FrEqNCW"},"outputs":[],"source":["# %pip (rather than !pip) installs into the environment of the running kernel\n","%pip install -r multi-lora-fine-tune/requirements.txt"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"kEXjcWRLqRIl"},"outputs":[],"source":["config_string = \"\"\"\n","{\n"," \"cutoff_len\": 256,\n"," \"group_by_length\": false,\n"," \"expand_right\": true,\n"," \"pad_token_id\": -1,\n"," \"save_step\": 2000,\n"," \"early_stop_test_step\": 2000,\n"," \"train_lora_candidate_num\": 4,\n"," 
\"train_lora_simultaneously_num\": 2,\n"," \"train_strategy\": \"optim\",\n"," \"lora\": [\n"," {\n"," \"name\": \"lora_0\",\n"," \"output\": \"lora_0\",\n"," \"optim\": \"adamw\",\n"," \"lr\": 3e-4,\n"," \"batch_size\": 16,\n"," \"micro_batch_size\": 4,\n"," \"test_batch_size\": 64,\n"," \"num_epochs\": 30,\n"," \"r\": 8,\n"," \"alpha\": 16,\n"," \"dropout\": 0.05,\n"," \"target_modules\": {\n"," \"q_proj\": true,\n"," \"k_proj\": false,\n"," \"v_proj\": true,\n"," \"o_proj\": false,\n"," \"w1_proj\": false,\n"," \"w2_proj\": false,\n"," \"w3_proj\": false\n"," },\n"," \"data\": \"training_data.json\",\n"," \"prompt\": \"multi-lora-fine-tune/template/template_demo.json\"\n"," },\n"," {\n"," \"name\": \"lora_1\",\n"," \"output\": \"lora_1\",\n"," \"optim\": \"adamw\",\n"," \"lr\": 3e-4,\n"," \"batch_size\": 16,\n"," \"micro_batch_size\": 4,\n"," \"test_batch_size\": 64,\n"," \"num_epochs\": 1,\n"," \"r\": 8,\n"," \"alpha\": 16,\n"," \"dropout\": 0.05,\n"," \"target_modules\": {\n"," \"q_proj\": true,\n"," \"k_proj\": false,\n"," \"v_proj\": true,\n"," \"o_proj\": false,\n"," \"w1_proj\": false,\n"," \"w2_proj\": false,\n"," \"w3_proj\": false\n"," },\n"," \"data\": \"multi-lora-fine-tune/data/data_demo.json\",\n"," \"prompt\": \"multi-lora-fine-tune/template/template_demo.json\"\n"," }\n"," ]\n","}\n","\"\"\"\n","\n","# Parse the hand-written text once so a malformed config fails here,\n","# before anything is written to disk or handed to the training script.\n","import json\n","json.loads(config_string)\n","\n","with open(\"./config.json\", \"w\") as f:\n","    f.write(config_string)\n"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"background_save":true},"id":"MSlAyiJetEgy"},"outputs":[],"source":["!python multi-lora-fine-tune/mlora.py \\\n"," --base_model openlm-research/open_llama_3b \\\n"," --config config.json"]},{"cell_type":"markdown","metadata":{"id":"Ls8iGBTow0fr"},"source":["## Inference"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"365__VkJw3q-","colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"status":"ok","timestamp":1703887700168,"user_tz":480,"elapsed":3257,"user":{"displayName":"Yufei 
Wang","userId":"15670977446030042093"}},"outputId":"a91ce7f0-2d3c-4fb6-97a5-772771122e7e"},"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/gdrive\n"]}],"source":["from google.colab import drive\n","drive.mount('/content/gdrive')"]},{"cell_type":"code","source":["# List only the adapter directory: a listing of the whole Drive root would\n","# store unrelated personal file names in the saved notebook output.\n","!ls /content/gdrive/MyDrive/lora_0"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"qF0wPXQdnpkQ","executionInfo":{"status":"ok","timestamp":1703887725085,"user_tz":480,"elapsed":5,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"}},"outputId":"57991fe2-4166-4dad-c6ad-52cef0c64e05"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# %pip (rather than !pip) installs into the environment of the running kernel\n","%pip install peft"],"metadata":{"id":"m5iFzwIinB7K"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["from peft import PeftModel\n","from transformers import GenerationConfig, LlamaForCausalLM, LlamaTokenizer\n","import torch"],"metadata":{"id":"sGXOOCcnnCWT"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["base_model = 'openlm-research/open_llama_3b'\n","lora_weights = '/content/gdrive/MyDrive/lora_0'\n","\n","tokenizer = LlamaTokenizer.from_pretrained(base_model)\n","model = LlamaForCausalLM.from_pretrained(\n"," base_model,\n"," load_in_8bit=True,\n"," torch_dtype=torch.float16,\n"," device_map=\"cuda:0\",\n",")\n","model = PeftModel.from_pretrained(\n"," model,\n"," lora_weights,\n"," 
torch_dtype=torch.float16,\n",")"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":209,"referenced_widgets":["4fa918c5a8f849cd812ac83ec7fe2f1e","6bfaee2361b646a5a21c2ae5e1023257","efcf8af77a114e74aaff95a20438702a","0dd4b00f793742eca9f87d73712e0b0e","6968c61c31604aca80e5745daaaf7ef6","500144acbc8c4fa1b06f026320ba8844","d98f83b1034d44ce84d2d133134d627c","287a2d39097c4e3ea09866f1340293dc","c1af2047df5d41ae8a6d0e0579a888cf","44414614da424efd8aac1788111a1d74","4191aaf7508840ceb0edbe05ed5d55fd","2ec956ffc8af48ea9c2ed605b9a1232a","9adda1cb7776459487337c79cd8de2ec","f6fce7b0d0d14b2b896b53c982173658","3460185852014621b82f51e14e0d4311","b43003bd11e5487f8f3f6957ffba03c8","cf9827ba6c814668816ae1501755ae4c","1187729f2eb947ec8c9fb5c44d5f4c6a","cfa193662e0c4f7b8d66c0ebc255a781","5b0c4e5306d244dfb16cc34ef70fc9a5","c7a6752ad86d4cb0b02e4638659e389a","85866eb60ef3492582cc2e373748010a","fef1536a9ec9495cb9a3582564cae4cc","7c85981816a04a7db6d71266d790ff2a","dff5f6a0ce3448d8846312716cebeb2c","515e810367c24f0687bd744303eb80fb","c0a01985d43b4a47a004eef011844308","3416a9c05e504b5f9fa69c852f1304b0","1d55b6f3bda446e797b0858e6db59d67","15b832b3cfe64f80a4d90053520ea985","1339381ed22e4350b9f6dcf65cf0f358","e15c5a3c547b436f827cc8552f2d2615","1d57926c94284cf8a9f524189023123a","d272281fa4ca48bb8d902408bb6897fc","4840bd8c3101481bbb0e12b9dacec08b","143717384ab544038e5952fbef276e8c","77937929d9f04aa6a07b240aed165ce8","e99fc782ccc04610b7dbfa40ae5f4c09","9ee756f4a494461eb8973268657cc4d9","5152e80bee06480b9de3d54ddd302705","8c6fed8ed357422cb4eb8593c2372624","0e323895b54f42619f153c610d98133e","2695a39b12e340f8985c5d22c09dbe6d","8e5be166caf744a5b754817c7a31f9bf","51d03f632f1042d5a1dab3d2bfa51a14","e81913c8e9214d29953fd4e021391d0d","b7723546836e45fb978de0dd907329e9","8ae07af1f213483da91759986df99abc","a41e518f1449498b839e9b73539d169f","b9168e27f69b405d885a94e1801bf7c1","b51b668afdbc4a5488513853b94b760b","7e827c582b1c45f392cde01d5e05b643","b9d1e2f19c334f3b96e97c9b318d9468","58fb40eb4c994e38
bbbf441ea274cc25","fc514bcf67f0418891792e51f30b73af","3606fa920d1f4d60872e739f4ca9b7ad","7fbd2ed58abe422dab2ee763ccc150c5","7f5d53cd9fae4bc5882bd8f1e0b3e3af","942df0378c62436a932e6ac57e388b7a","628020138bfc43e98b410d3226a47e35","b00c24c6257a42baa45934eb2120af32","3c283f77ce5b424e9829881d43327482","808740bdd78542a89da085a8eb946763","414bb5d9b41d46c6a3a6d819b9c35f24","25a6399de4db4ae4b32a012736115f8b","ab5411ad9d7a4ec7b5f3833ae24675b9"]},"id":"653kdOManF1r","executionInfo":{"status":"ok","timestamp":1703888258080,"user_tz":480,"elapsed":257358,"user":{"displayName":"Yufei Wang","userId":"15670977446030042093"}},"outputId":"21c1ec5a-e018-4b68-969c-f4cb418b68db"},"execution_count":null,"outputs":[{"output_type":"display_data","data":{"text/plain":["tokenizer.model: 0%| | 0.00/534k [00:00 y:\\n ... \n","120 import java.util.Random; \\n \\npublic class Ge... \n","146 SELECT department, COUNT(employee_ID)\\nFROM em... \n","153 SELECT SUM(CASE WHEN gender = 'female' THEN sa... \n","170 // Algorithm to find the largest element in an... \n","203 \"\"\"\\nWrite a code to find the maximum in a giv... \n","212 \"\"\"\\nCreate a program to compute the checksum ... \n","249 import mysql.connector\\n\\nmydb = mysql.connect... \n","253 def calculator():\\n number1 = int(input(\"Pl... \n","257 mylist = [x for x in mylist if x % 3 == 0] \n","313 def greet_user(name):\\n \"\"\"\\n Greet the ... \n","327 def multiply(x,y):\\n if(y == 0):\\n return ... \n","344
\\n
\\n \n","
\n","\n","\n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n","
instructioninputoutput
34Create a JSX code that renders a \"Hello, World...import React from \"react\";\\n\\nfunction App() {...
58Generate a random number between 0 and 1 (incl...Math.random(); // a random number between 0 an...
96Create a quick-sort algorithm in Python.def quick_sort(arr):\\n \"\"\"Sort a list of nu...
99Write a function that takes in a list of numbe...list = [8, 2, 14, 25]def find_greatest(list):\\n \"\"\"Print out the...
109Create a function to calculate the maximum of ...def max_of_two(x, y):\\n if x > y:\\n ...
120Write a Java program to generate random numbersimport java.util.Random; \\n \\npublic class Ge...
146Write an SQL query to select the number of emp...SELECT department, COUNT(employee_ID)\\nFROM em...
153Write an SQL query to calculate the difference...SELECT SUM(CASE WHEN gender = 'female' THEN sa...
170Write an algorithm to find the largest element...[8, 11, 12, 5, 3]// Algorithm to find the largest element in an...
203Write a code to find the maximum in a given li...mylist = [1,2,3,4,5]\"\"\"\\nWrite a code to find the maximum in a giv...
212Create a program to compute the checksum of a ...data_packet = [0xff, 0x0a, 0x1b, 0x3f]\"\"\"\\nCreate a program to compute the checksum ...
249Connect to a MySQL database and select all row...import mysql.connector\\n\\nmydb = mysql.connect...
253Write a simple calculator program.def calculator():\\n number1 = int(input(\"Pl...
257Change the following array so that it only con...mylist = [2, 4, 5, 6, 7, 11, 12, 22]mylist = [x for x in mylist if x % 3 == 0]
313Create a program which will take the user's na...name = 'John'def greet_user(name):\\n \"\"\"\\n Greet the ...
327Write a code to multiple two numbers without u...def multiply(x,y):\\n if(y == 0):\\n return ...
344Create an HTML form with radio buttons for sel...<form>\\n <label>Gender:</label><br>\\n <input...
382Write a Python code snippet to print the pyram...4* \\n ***\\n *****\\n *******
398Write a Python function to check if a given st...word1 = \"cat\"\\nword2 = \"tac\"def is_anagram(word1, word2):\\n return sorted(...
404Describe how to debug a C++ program using GDB.Debugging a C++ program using GDB involves run...
432Write a Python script to find the common eleme...list1 = [1, 2, 3, 5, 7]\\nlist2 = [2, 3, 4, 5, 6]def common_elements(list1, list2):\\n common...
440Create a function to convert a given number fr...def dec_to_binary(num):\\n binary = \"\"\\n ...
442Implement a Java program for finding the index...public int binarySearch(int[] arr, int val){\\n...
449Write a SQL query to join two tables on a spec...Table 1:\\nid name age\\n1 a 15\\n2 ...SELECT table1.id, table1.name, table1.age, tab...
466Describe the details of the try-except stateme...The try-except statement in Python is used to ...
482Convert the following code from Swift to Java.let age = 25int age = 25;
527Create an array in Java with 10 floating-point...// Create an array \\nfloat arr[] = {1.1, 2.2, ...
552Create a binary search tree in JavaScript.class Node { \\n constructor(data) \\n { \\n ...
562Write a code to find the square of the first n...def square_of_first_n_number(n):\\n \"\"\"Find ...
624Perform a linear search in a list named 'mylis...mylist = [1, 2, 3, 4, 5, 6, 7]\\ntarget = 4def linear_search(mylist, target):\\n for i in ...
643Build a deep learning model in Python to predi...# import libraries\\nimport numpy as np\\nimport...
645Write a JavaScript function to sort an array o...function sortArray(arr) {\\n return arr.sort(fu...
655Create a loop in JavaScript that prints the nu...for (let i = 1; i <= 10; i++) {\\n console.l...
662Calculate the factorial of a given number.The number is 75040
697Describe how to add an element in a linked lis...// To add an element in a linked list in Pytho...
718What is the purpose of the \"break\" keyword in ...The \"break\" keyword is used to immediately bre...
745Concatenate the two strings below, with a spac...A = \"Hello\"\\nB = \"World!\"A + ' ' + B
750Write a bash script to list the content of the...#!/bin/bash\\n\\nls
751Create a JavaScript object to represent a pers...let person = {\\n name: \"John Doe\",\\n age: 25...
768Write a SQL query to select the row with the c...SELECT * FROM customers WHERE customer_id = 'C...
776Write a JavaScript code to add two numbers usi...let a = prompt('Enter the first number:');\\nle...
779Edit the provided CSS rule to make all element....myClass { \\n font-size: 16px;\\n}.myClass { \\n font-size: 16px;\\n font-weight...
813Write a method that prints out a square of siz...n=5public static void printSquare(int n) { \\n ...
836Rewrite the following SQL query so that it pro...SELECT * FROM Orders WHERE OrderId IN (SELECT ...SELECT Orders.* \\nFROM Orders \\nINNER JOIN Ord...
838Create an array of ten unique numbers within t...int[] numbers = {10, 13, 16, 23, 25, 37, 41, 4...
877You should create a Java program to implement ...public class BinarySearch \\n{ \\n // Returns...
903Write a SQL query to retrieve all the rows fro...SELECT * FROM customers;
910You are given a list of numbers. Write a progr...[1, 2, 3, 2, 1]def is_palindrome(arr):\\n rev_arr = arr[::-1]...
922Generate a string of 5 random characters from ...import random\\n\\ndef random_string():\\n cha...
964Create a neural network in Python to recognize...MNIST hand-written digit datasetThe code to create a neural network in Python ...
981Write a database query to retrieve the names o...SELECT name \\nFROM authors;
\n","
\n","
\n","\n","
\n"," \n","\n"," \n","\n"," \n","
\n","\n","\n","
\n"," \n","\n","\n","\n"," \n","
\n","
\n"," \n"],"application/vnd.google.colaboratory.module+javascript":"\n import \"https://ssl.gstatic.com/colaboratory/data_table/881c4a0d49046431/data_table.js\";\n\n const table = window.createDataTable({\n data: [[{\n 'v': 34,\n 'f': \"34\",\n },\n\"Create a JSX code that renders a \\\"Hello, World!\\\" message in the browser.\",\n\"\",\n\"import React from \\\"react\\\";\\n\\nfunction App() {\\n return (\\n
\\n

Hello, World!<\\/h1>\\n <\\/div>\\n );\\n}\\n\\nexport default App;\"],\n [{\n 'v': 58,\n 'f': \"58\",\n },\n\"Generate a random number between 0 and 1 (inclusively).\",\n\"\",\n\"Math.random(); // a random number between 0 and 1 (inclusively)\"],\n [{\n 'v': 96,\n 'f': \"96\",\n },\n\"Create a quick-sort algorithm in Python.\",\n\"\",\n\"def quick_sort(arr):\\n \\\"\\\"\\\"Sort a list of numbers in ascending order using the Quick-Sort algorithm\\\"\\\"\\\"\\n if len(arr) == 0:\\n return []\\n\\n pivot = arr[0]\\n left_arr = [x for x in arr if x < pivot]\\n right_arr = [x for x in arr if x > pivot]\\n return quick_sort(left_arr) + [pivot] + quick_sort(right_arr)\"],\n [{\n 'v': 99,\n 'f': \"99\",\n },\n\"Write a function that takes in a list of numbers and prints out the greatest number.\",\n\"list = [8, 2, 14, 25]\",\n\"def find_greatest(list):\\n \\\"\\\"\\\"Print out the greatest number from a list of numbers.\\\"\\\"\\\"\\n greatest = list[0]\\n for num in list:\\n if num > greatest:\\n greatest = num\\n print('The greatest number is: ', greatest)\"],\n [{\n 'v': 109,\n 'f': \"109\",\n },\n\"Create a function to calculate the maximum of two numbers.\",\n\"\",\n\"def max_of_two(x, y):\\n if x > y:\\n return x\\n else:\\n return y\"],\n [{\n 'v': 120,\n 'f': \"120\",\n },\n\"Write a Java program to generate random numbers\",\n\"\",\n\"import java.util.Random; \\n \\npublic class GenerateRandom { \\n \\n public static void main(String[] args) \\n { \\n \\n Random rand = new Random(); \\n \\n // Generate random integers in range 0 to 999 \\n int x = rand.nextInt(1000); \\n System.out.println(\\\"Random Integers: \\\" + x); \\n \\n // Generate Random doubles \\n double y = rand.nextDouble(); \\n System.out.println(\\\"Random Doubles: \\\" + y); \\n \\n // Generate Random Boolean \\n boolean z = rand.nextBoolean(); \\n System.out.println(\\\"Random Boolean: \\\" + z); \\n } \\n}\"],\n [{\n 'v': 146,\n 'f': \"146\",\n },\n\"Write an SQL query to select the number of 
employees in each department, sorted by the department name in ascending order.\",\n\"\",\n\"SELECT department, COUNT(employee_ID)\\nFROM employees\\nGROUP BY department\\nORDER BY department ASC;\"],\n [{\n 'v': 153,\n 'f': \"153\",\n },\n\"Write an SQL query to calculate the difference between the total salaries of male and female employees in a table.\",\n\"\",\n\"SELECT SUM(CASE WHEN gender = 'female' THEN salary ELSE 0 END) - SUM(CASE WHEN gender = 'male' THEN salary ELSE 0 END)\\nFROM employees;\"],\n [{\n 'v': 170,\n 'f': \"170\",\n },\n\"Write an algorithm to find the largest element in an array.\",\n\"[8, 11, 12, 5, 3]\",\n\"// Algorithm to find the largest element in an array\\n\\n// Step 1: Create a variable 'max' and initialize it with value of the first element in the array\\nint max = arr[0];\\n\\n// Step 2: Iterate through the array and compare each element with 'max'\\nfor (int i = 1; i < arr.length; i++) {\\n if (arr[i] > max) {\\n max = arr[i];\\n }\\n}\\n\\n// Step 3: Return the value of 'max'\\nreturn max;\"],\n [{\n 'v': 203,\n 'f': \"203\",\n },\n\"Write a code to find the maximum in a given list of integers.\",\n\"mylist = [1,2,3,4,5]\",\n\"\\\"\\\"\\\"\\nWrite a code to find the maximum in a given list of integers\\n\\\"\\\"\\\"\\n\\n# List containing the elements\\nmylist = [1,2,3,4,5]\\n\\n# Finding the maximum element\\nmax = mylist[0]\\n\\n# Looping through each element to find if it is the maximum\\nfor i in range(1,len(mylist)):\\n # Comparing the element with the maximum\\n if mylist[i] > max:\\n max = mylist[i]\\n\\n# Printing the maximum element\\nprint(\\\"Maximum element of the list is\\\", max)\"],\n [{\n 'v': 212,\n 'f': \"212\",\n },\n\"Create a program to compute the checksum of a given data packet\",\n\"data_packet = [0xff, 0x0a, 0x1b, 0x3f]\",\n\"\\\"\\\"\\\"\\nCreate a program to compute the checksum of a given data packet\\n\\\"\\\"\\\"\\n\\ndef compute_checksum(data_packet):\\n checksum = 0\\n for x in data_packet:\\n 
checksum += x\\n return checksum\\n\\nif __name__ == '__main__':\\n data_packet = [0xff, 0x0a, 0x1b, 0x3f]\\n print(compute_checksum(data_packet))\"],\n [{\n 'v': 249,\n 'f': \"249\",\n },\n\"Connect to a MySQL database and select all rows from Customers where Phone is greater than 1000.\",\n\"\",\n\"import mysql.connector\\n\\nmydb = mysql.connector.connect(\\n host=\\\"localhost\\\",\\n user=\\\"\\\",\\n passwd=\\\"\\\",\\n database=\\\"mydatabase\\\"\\n)\\n\\nmycursor = mydb.cursor()\\n\\nmycursor.execute(\\\"SELECT * FROM customers WHERE phone > 1000\\\")\\n\\nmyresult = mycursor.fetchall()\\n\\nfor x in myresult:\\n print(x)\"],\n [{\n 'v': 253,\n 'f': \"253\",\n },\n\"Write a simple calculator program.\",\n\"\",\n\"def calculator():\\n number1 = int(input(\\\"Please enter first number: \\\"))\\n number2 = int(input(\\\"Please enter second number: \\\"))\\n print(\\\"Please choose operation -\\\\n\\\" \\\\\\n \\\"1. Add\\\\n\\\" \\\\\\n \\\"2. Subtract\\\\n\\\" \\\\\\n \\\"3. Multiply\\\\n\\\" \\\\\\n \\\"4. 
Divide\\\\n\\\") \\n\\n choice = int(input(\\\"Enter your choice: \\\"))\\n if choice == 1:\\n ans = number1 + number2\\n print(\\\"Answer={}\\\".format(ans))\\n elif choice == 2:\\n ans = number1 - number2\\n print(\\\"Answer={}\\\".format(ans))\\n elif choice == 3:\\n ans = number1 * number2\\n print(\\\"Answer={}\\\".format(ans))\\n elif choice == 4:\\n ans = number1 / number2\\n print(\\\"Answer={}\\\".format(ans))\\n else:\\n print(\\\"Invalid Choice\\\")\"],\n [{\n 'v': 257,\n 'f': \"257\",\n },\n\"Change the following array so that it only contains numbers divisible by 3\",\n\"mylist = [2, 4, 5, 6, 7, 11, 12, 22]\",\n\"mylist = [x for x in mylist if x % 3 == 0]\"],\n [{\n 'v': 313,\n 'f': \"313\",\n },\n\"Create a program which will take the user's name and output a custom message depending on the supplied name\",\n\"name = 'John'\",\n\"def greet_user(name):\\n \\\"\\\"\\\"\\n Greet the user with a custom message depending on the supplied name.\\n \\\"\\\"\\\"\\n if name == 'John':\\n print('Hey there John! Welcome back!')\\n elif name == 'Mary':\\n print('Good morning Mary! How are you doing today?')\\n else:\\n print('Hi there! Welcome to our service!')\"],\n [{\n 'v': 327,\n 'f': \"327\",\n },\n\"Write a code to multiple two numbers without using the multiplication operator.\",\n\"\",\n\"def multiply(x,y):\\n if(y == 0):\\n return 0\\n return x + multiply(x,y-1)\\n\\nmultiply(5,4) # 20\"],\n [{\n 'v': 344,\n 'f': \"344\",\n },\n\"Create an HTML form with radio buttons for selecting gender.\",\n\"\",\n\"\\n