|
@@ -2,7 +2,7 @@
|
|
|
"cells": [
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "theoretical-diary",
|
|
|
+ "id": "posted-subcommittee",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"# Monitor GPT training performance with varying config\n",
|
|
@@ -48,7 +48,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "gross-macro",
|
|
|
+ "id": "turned-lender",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"---\n",
|
|
@@ -60,7 +60,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "human-classics",
|
|
|
+ "id": "controlling-advertiser",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"---\n",
|
|
@@ -72,7 +72,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "finnish-think",
|
|
|
+ "id": "improving-speech",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"<a id=\"Rerun_Cell\"></a>"
|
|
@@ -81,7 +81,7 @@
|
|
|
{
|
|
|
"cell_type": "code",
|
|
|
"execution_count": 1,
|
|
|
- "id": "saving-locator",
|
|
|
+ "id": "sharing-headline",
|
|
|
"metadata": {},
|
|
|
"outputs": [],
|
|
|
"source": [
|
|
@@ -91,7 +91,7 @@
|
|
|
{
|
|
|
"cell_type": "code",
|
|
|
"execution_count": 2,
|
|
|
- "id": "adverse-genetics",
|
|
|
+ "id": "warming-brooklyn",
|
|
|
"metadata": {},
|
|
|
"outputs": [
|
|
|
{
|
|
@@ -173,19 +173,19 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "ecological-delaware",
|
|
|
+ "id": "protective-private",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"---\n",
|
|
|
"## Check how big is your model - \n",
|
|
|
"modify the parameters in the [params_cnt.sh](./params_cnt.sh)\n",
|
|
|
- "I got 6 Billion :) what about you ?"
|
|
|
+ "I got 6.6 Billion :) what about you ?"
|
|
|
]
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "code",
|
|
|
"execution_count": 3,
|
|
|
- "id": "latin-granny",
|
|
|
+ "id": "pretty-laser",
|
|
|
"metadata": {},
|
|
|
"outputs": [
|
|
|
{
|
|
@@ -203,7 +203,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "widespread-sunset",
|
|
|
+ "id": "acknowledged-thinking",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"---\n",
|
|
@@ -227,7 +227,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "standing-change",
|
|
|
+ "id": "imperial-fellowship",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"---\n",
|
|
@@ -243,7 +243,7 @@
|
|
|
{
|
|
|
"cell_type": "code",
|
|
|
"execution_count": 4,
|
|
|
- "id": "novel-campbell",
|
|
|
+ "id": "continued-yahoo",
|
|
|
"metadata": {},
|
|
|
"outputs": [
|
|
|
{
|
|
@@ -550,7 +550,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "center-microphone",
|
|
|
+ "id": "available-relaxation",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"--- \n",
|
|
@@ -564,7 +564,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "basic-horror",
|
|
|
+ "id": "naked-lodge",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"---\n",
|
|
@@ -574,7 +574,7 @@
|
|
|
},
|
|
|
{
|
|
|
"cell_type": "markdown",
|
|
|
- "id": "recovered-pleasure",
|
|
|
+ "id": "compound-tonight",
|
|
|
"metadata": {},
|
|
|
"source": [
|
|
|
"-----\n",
|