diff --git "a/experiment/rwkv-x-exp/v5-r3-memory/L12-D2048-E1e-1-ctx4k/part1.ipynb" "b/experiment/rwkv-x-exp/v5-r3-memory/L12-D2048-E1e-1-ctx4k/part1.ipynb" --- "a/experiment/rwkv-x-exp/v5-r3-memory/L12-D2048-E1e-1-ctx4k/part1.ipynb" +++ "b/experiment/rwkv-x-exp/v5-r3-memory/L12-D2048-E1e-1-ctx4k/part1.ipynb" @@ -3,13 +3,13 @@ { "attachments": {}, "cell_type": "markdown", - "id": "34787543", + "id": "d16d19a7", "metadata": { "papermill": { - "duration": 0.004045, - "end_time": "2023-09-06T00:20:51.170319", + "duration": 0.004251, + "end_time": "2023-09-06T01:53:47.272181", "exception": false, - "start_time": "2023-09-06T00:20:51.166274", + "start_time": "2023-09-06T01:53:47.267930", "status": "completed" }, "tags": [] @@ -25,13 +25,13 @@ { "attachments": {}, "cell_type": "markdown", - "id": "8aa40f90", + "id": "e7eaa6b5", "metadata": { "papermill": { - "duration": 0.002614, - "end_time": "2023-09-06T00:20:51.175858", + "duration": 0.002635, + "end_time": "2023-09-06T01:53:47.277736", "exception": false, - "start_time": "2023-09-06T00:20:51.173244", + "start_time": "2023-09-06T01:53:47.275101", "status": "completed" }, "tags": [] @@ -43,19 +43,19 @@ { "cell_type": "code", "execution_count": 1, - "id": "53fff9d1", + "id": "43c42c12", "metadata": { "execution": { - "iopub.execute_input": "2023-09-06T00:20:51.180467Z", - "iopub.status.busy": "2023-09-06T00:20:51.180322Z", - "iopub.status.idle": "2023-09-06T00:20:52.066156Z", - "shell.execute_reply": "2023-09-06T00:20:52.065233Z" + "iopub.execute_input": "2023-09-06T01:53:47.281975Z", + "iopub.status.busy": "2023-09-06T01:53:47.281689Z", + "iopub.status.idle": "2023-09-06T01:53:48.160757Z", + "shell.execute_reply": "2023-09-06T01:53:48.159854Z" }, "papermill": { - "duration": 0.890028, - "end_time": "2023-09-06T00:20:52.068428", + "duration": 0.883492, + "end_time": "2023-09-06T01:53:48.162633", "exception": false, - "start_time": "2023-09-06T00:20:51.178400", + "start_time": "2023-09-06T01:53:47.279141", "status": "completed" }, "tags": [] @@ -83,19 +83,19 @@ { "cell_type": "code", "execution_count": 2, - "id": "a388f6e6", + "id": "4f145f3c", "metadata": { "execution": { - "iopub.execute_input": "2023-09-06T00:20:52.076313Z", - "iopub.status.busy": "2023-09-06T00:20:52.076079Z", - "iopub.status.idle": "2023-09-06T00:20:54.167404Z", - "shell.execute_reply": "2023-09-06T00:20:54.166623Z" + "iopub.execute_input": "2023-09-06T01:53:48.169937Z", + "iopub.status.busy": "2023-09-06T01:53:48.169610Z", + "iopub.status.idle": "2023-09-06T01:53:50.281603Z", + "shell.execute_reply": "2023-09-06T01:53:50.280695Z" }, "papermill": { - "duration": 2.097425, - "end_time": "2023-09-06T00:20:54.169133", + "duration": 2.117825, + "end_time": "2023-09-06T01:53:50.283651", "exception": false, - "start_time": "2023-09-06T00:20:52.071708", + "start_time": "2023-09-06T01:53:48.165826", "status": "completed" }, "tags": [] @@ -118,19 +118,19 @@ { "cell_type": "code", "execution_count": 3, - "id": "e2f52f13", + "id": "e478c7e4", "metadata": { "execution": { - "iopub.execute_input": "2023-09-06T00:20:54.176834Z", - "iopub.status.busy": "2023-09-06T00:20:54.176573Z", - "iopub.status.idle": "2023-09-06T00:20:54.185506Z", - "shell.execute_reply": "2023-09-06T00:20:54.184977Z" + "iopub.execute_input": "2023-09-06T01:53:50.291201Z", + "iopub.status.busy": "2023-09-06T01:53:50.290951Z", + "iopub.status.idle": "2023-09-06T01:53:50.300137Z", + "shell.execute_reply": "2023-09-06T01:53:50.299422Z" }, "papermill": { - "duration": 0.014335, - "end_time": "2023-09-06T00:20:54.186704", + "duration": 0.014857, + "end_time": "2023-09-06T01:53:50.301805", "exception": false, - "start_time": "2023-09-06T00:20:54.172369", + "start_time": "2023-09-06T01:53:50.286948", "status": "completed" }, "tags": [] @@ -197,19 +197,19 @@ { "cell_type": "code", "execution_count": 4, - "id": "ff222a35", + "id": "c0d1081e", "metadata": { "execution": { - "iopub.execute_input": "2023-09-06T00:20:54.193945Z", - "iopub.status.busy": "2023-09-06T00:20:54.193803Z", - "iopub.status.idle": "2023-09-06T00:20:54.416273Z", - "shell.execute_reply": "2023-09-06T00:20:54.415523Z" + "iopub.execute_input": "2023-09-06T01:53:50.309388Z", + "iopub.status.busy": "2023-09-06T01:53:50.309130Z", + "iopub.status.idle": "2023-09-06T01:53:50.530630Z", + "shell.execute_reply": "2023-09-06T01:53:50.529804Z" }, "papermill": { - "duration": 0.227953, - "end_time": "2023-09-06T00:20:54.418012", + "duration": 0.227251, + "end_time": "2023-09-06T01:53:50.532377", "exception": false, - "start_time": "2023-09-06T00:20:54.190059", + "start_time": "2023-09-06T01:53:50.305126", "status": "completed" }, "tags": [] @@ -236,13 +236,13 @@ }, { "cell_type": "markdown", - "id": "1f427699", + "id": "ddc1086b", "metadata": { "papermill": { - "duration": 0.003102, - "end_time": "2023-09-06T00:20:54.424585", + "duration": 0.003123, + "end_time": "2023-09-06T01:53:50.538962", "exception": false, - "start_time": "2023-09-06T00:20:54.421483", + "start_time": "2023-09-06T01:53:50.535839", "status": "completed" }, "tags": [] @@ -254,16480 +254,24 @@ { "cell_type": "code", "execution_count": 5, - "id": "e4a7fe9a", + "id": "636df5aa", "metadata": { "execution": { - "iopub.execute_input": "2023-09-06T00:20:54.430076Z", - "iopub.status.busy": "2023-09-06T00:20:54.429584Z", - "iopub.status.idle": "2023-09-06T00:38:40.364127Z", - "shell.execute_reply": "2023-09-06T00:38:40.363334Z" + "iopub.execute_input": "2023-09-06T01:53:50.544775Z", + "iopub.status.busy": "2023-09-06T01:53:50.544524Z", + "iopub.status.idle": "2023-09-06T01:53:59.821234Z", + "shell.execute_reply": "2023-09-06T01:53:59.820428Z" }, "papermill": { - "duration": 1065.938908, - "end_time": "2023-09-06T00:38:40.366018", + "duration": 9.281152, + "end_time": "2023-09-06T01:53:59.823158", "exception": false, - "start_time": "2023-09-06T00:20:54.427110", + "start_time": "2023-09-06T01:53:50.542006", "status": "completed" }, "tags": [] }, "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "Downloading readme: 0%| | 0.00/433 [00:00