# encoding: utf-8
from gpt_model import GPTConfig, GPTModel
import numpy as np
import sys
import torch
from data_set import load_tokenizer

# --- Training configuration -------------------------------------------------
# Select the compute device: use the GPU when CUDA is available, otherwise
# fall back to the CPU. The value is a device string accepted by torch.
device = "cuda" if torch.cuda.is_available() else "cpu"
# NOTE(review): presumably the optimizer step size — confirm where it is used.
learning_rate = 1e-3
# NOTE(review): presumably the number of training iterations — confirm
# against the training loop.
max_iters = 500

# Read the data using numpy's memmap
tr…