当前位置: 首页 > wzjs >正文

泉州网站制作多少钱网站服务器搭建与管理

泉州网站制作多少钱,网站服务器搭建与管理,如何做淘外网站推广,体育建设网站首页【2025】Datawhale AI春训营-蛋白质预测(AI生命科学)-Task2笔记 本文对Task2使用的代码进行理解。 任务描述 Task2的任务仍然是通过对反应中包含的蛋白质残基信息,运用深度学习模型构建蛋白质3D结构的隐式模型,从而达成准确预测…

【2025】Datawhale AI春训营-蛋白质预测(AI+生命科学)-Task2笔记

本文对 Task2 所使用的代码逐段进行解读。

任务描述

Task2 的任务仍然是:利用反应中包含的蛋白质残基信息,运用深度学习模型构建蛋白质 3D 结构的隐式模型,从而准确预测蛋白质的内在无序区域(IDRs)。任务的评价指标是预测结果与实验真实结果之间的 F1 score。

代码理解

1、导入模块

import argparse
import math
import pickle

import torch
import torch.nn as nn
import torch.nn.functional as F
from omegaconf import OmegaConf
from sklearn.metrics import f1_score
from torch.nn import TransformerEncoderLayer, TransformerEncoder
from torch.utils.data import Dataset, DataLoader
from tqdm import tqdm

2、定义氨基酸类型

# One-letter residue codes; a residue's position in this list is the
# index it is assigned wherever the list is enumerated.
restypes = list('ARNDCQEGHILKMFPSTWYV')

# Extra one-letter codes kept alongside the 20 entries above.
unsure_restype = 'X'
unknown_restype = 'U'

3、定义数据集创建方法

def make_dataset(data_config, train_rate=0.7, valid_rate=0.2):
    """Load the pickled records and split them into train/valid/test datasets.

    The records are split in file order (no shuffling): the leading
    ``train_rate`` fraction is used for training, the following
    ``valid_rate`` fraction for validation, and the remainder for testing.

    Args:
        data_config: Config object exposing ``data_path``, the path of a
            pickle file that holds a sliceable sequence of records.
        train_rate: Fraction of the records assigned to the training split.
        valid_rate: Fraction of the records assigned to the validation split.

    Returns:
        A ``(train_dataset, valid_dataset, test_dataset)`` tuple of
        ``DisProtDataset`` objects.
    """
    # NOTE(security): pickle.load can execute arbitrary code while
    # deserializing; only point data_path at files from a trusted source.
    with open(data_config.data_path, 'rb') as f:
        data = pickle.load(f)

    total_number = len(data)

    # Binary floating point cannot represent most decimal fractions exactly
    # (0.7 + 0.2 evaluates to 0.8999999999999999), so a product that should
    # land exactly on an integer can come out a hair below it and lose one
    # sample when truncated. The tiny epsilon absorbs that representation
    # error without affecting products that are genuinely fractional.
    eps = 1e-9
    train_sep = int(total_number * train_rate + eps)
    valid_sep = int(total_number * (train_rate + valid_rate) + eps)

    train_dataset = DisProtDataset(data[:train_sep])
    valid_dataset = DisProtDataset(data[train_sep:valid_sep])
    test_dataset = DisProtDataset(data[valid_sep:])
    return train_dataset, valid_dataset, test_dataset

4、定义数据集

class DisProtDataset(Dataset):
    """Dataset of one-hot encoded residue sequences with per-position labels.

    Every record must provide a ``'sequence'`` entry (iterated character by
    character) and a ``'label'`` entry (each character converted with
    ``int``). Characters found in ``restypes`` get their own one-hot
    channel; every other character shares the extra ``'X'`` channel.
    """

    def __init__(self, dict_data):
        """Collect the sequences and labels and build the channel lookup."""
        all_sequences = [record['sequence'] for record in dict_data]
        all_labels = [record['label'] for record in dict_data]
        assert len(all_sequences) == len(all_labels)

        self.sequences = all_sequences
        self.labels = all_labels

        # 'X' takes channel 20; the entries of restypes take their list index.
        channel_of = {'X': 20}
        for channel, residue in enumerate(restypes):
            channel_of[residue] = channel
        self.residue_mapping = channel_of

    def __len__(self):
        """Return the number of stored sequences."""
        return len(self.sequences)

    def __getitem__(self, idx):
        """Return ``(one_hot, label)`` for the record at position ``idx``.

        ``one_hot`` has one row per character and one column per entry of
        ``residue_mapping``; ``label`` is a 1-D ``torch.long`` tensor.
        """
        residues = self.sequences[idx]
        n_positions = len(residues)

        # Resolve each character to its channel, falling back to 'X'.
        fallback = self.residue_mapping['X']
        columns = [
            self.residue_mapping[residue] if residue in restypes else fallback
            for residue in residues
        ]

        # Set exactly one entry per row with a single indexed assignment.
        one_hot = torch.zeros(n_positions, len(self.residue_mapping))
        rows = torch.arange(n_positions)
        one_hot[rows, torch.tensor(columns, dtype=torch.long)] = 1

        label = torch.tensor([int(flag) for flag in self.labels[idx]], dtype=torch.long)
        return one_hot, label

5、定义位置编码类

class PositionalEncoding(nn.Module):
    """Add fixed sinusoidal position encodings to the input, then apply dropout.

    The encoding table is precomputed once for ``max_len`` positions and
    stored as a non-trainable buffer named ``pe`` of shape
    ``(1, max_len, d_model)``.

    Args:
        d_model: Size of the last (feature) dimension of the inputs.
        dropout: Dropout probability applied after adding the encoding.
        max_len: Number of positions to precompute. Inputs whose dimension 1
            is larger than this cannot be broadcast against the table.
    """

    def __init__(self, d_model, dropout=0.0, max_len=40):
        super().__init__()
        position = torch.arange(max_len).unsqueeze(1)
        div_term = torch.exp(torch.arange(0, d_model, 2) * (-math.log(10000.0) / d_model))
        angles = position * div_term  # (max_len, ceil(d_model / 2))

        pe = torch.zeros(1, max_len, d_model)
        pe[0, :, 0::2] = torch.sin(angles)
        # For an odd d_model there is one fewer odd-indexed column than
        # even-indexed ones, so trim the angle table to fit; for an even
        # d_model the slice is a no-op.
        pe[0, :, 1::2] = torch.cos(angles[:, : d_model // 2])

        self.register_buffer("pe", pe)
        self.dropout = nn.Dropout(p=dropout)

    def forward(self, x):
        """Return ``x`` plus the position encoding, passed through dropout.

        Dimension 1 of ``x`` is treated as the position axis. A 3-D input is
        added to the table directly; for a 4-D input the table gets an extra
        axis so it broadcasts over dimension 2. Inputs of any other rank
        only go through dropout.
        """
        if len(x.shape) == 3:
            x = x + self.pe[:, : x.size(1)]
        elif len(x.shape) == 4:
            x = x + self.pe[:, : x.size(1), None, :]
        return self.dropout(x)

6、定义模型

class DisProtModel(nn.Module):
    """Transformer-encoder model that produces an output vector per position.

    Pipeline: linear input projection -> positional encoding -> layer norm
    -> dropout -> stacked transformer encoder layers -> two-layer output
    head.

    Args:
        model_config: Config object providing ``i_dim`` (input feature
            size), ``d_model`` (hidden size), ``n_head`` (attention heads),
            ``n_layer`` (encoder layers) and ``o_dim`` (output size).
    """

    def __init__(self, model_config):
        super().__init__()
        hidden = model_config.d_model
        self.d_model = hidden
        self.n_head = model_config.n_head
        self.n_layer = model_config.n_layer

        # Input stage: project the features to the hidden size, add the
        # position information, then normalise and regularise.
        self.input_layer = nn.Linear(model_config.i_dim, hidden)
        self.position_embed = PositionalEncoding(hidden, max_len=20000)
        self.input_norm = nn.LayerNorm(hidden)
        self.dropout_in = nn.Dropout(p=0.1)

        # Encoder stack; batch_first=True means inputs are (batch, seq, feature).
        layer = TransformerEncoderLayer(
            d_model=hidden,
            nhead=self.n_head,
            activation='gelu',
            batch_first=True,
        )
        self.transformer = TransformerEncoder(layer, num_layers=self.n_layer)

        # Output head applied to each position.
        head = [
            nn.Linear(hidden, hidden),
            nn.GELU(),
            nn.Dropout(p=0.1),
            nn.Linear(hidden, model_config.o_dim),
        ]
        self.output_layer = nn.Sequential(*head)

    def forward(self, x):
        """Run ``x`` through every stage in order and return the head's output."""
        stages = (
            self.input_layer,
            self.position_embed,
            self.input_norm,
            self.dropout_in,
            self.transformer,
            self.output_layer,
        )
        for stage in stages:
            x = stage(x)
        return x

7、定义指标评估方法

def metric_fn(pred, gt):
    """Compute the micro-averaged F1 score of predictions against labels.

    Args:
        pred: Tensor of per-class scores; the predicted class is the argmax
            over the last dimension.
        gt: Tensor of ground-truth class indices.

    Returns:
        The value returned by ``f1_score`` with ``average='micro'`` over the
        flattened predictions and labels.
    """
    # Detach and move to CPU so the scoring runs outside autograd and off-device.
    scores_cpu = pred.detach().cpu()
    truth_cpu = gt.detach().cpu()

    predicted = scores_cpu.argmax(dim=-1).view(-1)
    expected = truth_cpu.view(-1)
    return f1_score(y_true=expected, y_pred=predicted, average='micro')

8、定义主函数

def _mean_validation_f1(model, dataloader, device):
    """Return ``metric_fn`` averaged over the batches of ``dataloader``.

    The model is switched to eval mode and gradients are disabled while
    the batches are scored.
    """
    model.eval()
    running = 0.
    with torch.no_grad():
        for sequence, label in dataloader:
            sequence = sequence.to(device)
            label = label.to(device)
            running += metric_fn(model(sequence), label)
    return running / len(dataloader)


if __name__ == '__main__':
    device = 'cuda' if torch.cuda.is_available() else 'cpu'

    # Command line: only the path of the YAML config is configurable.
    parser = argparse.ArgumentParser('IDRs prediction')
    parser.add_argument('--config_path', default='./config.yaml')
    args = parser.parse_args()
    config = OmegaConf.load(args.config_path)

    # Data: the test split is created but not used by this script.
    train_dataset, valid_dataset, test_dataset = make_dataset(config.data)
    train_dataloader = DataLoader(dataset=train_dataset, **config.train.dataloader)
    valid_dataloader = DataLoader(dataset=valid_dataset, batch_size=1, shuffle=False)

    # Model, optimizer and loss.
    model = DisProtModel(config.model).to(device)
    optimizer = torch.optim.AdamW(
        model.parameters(),
        lr=config.train.optimizer.lr,
        weight_decay=config.train.optimizer.weight_decay,
    )
    loss_fn = nn.CrossEntropyLoss()

    # Score of the untrained model, as a reference point.
    print("init f1_score:", _mean_validation_f1(model, valid_dataloader, device))

    for epoch in range(config.train.epochs):
        # Training pass.
        progress_bar = tqdm(
            train_dataloader,
            initial=0,
            desc=f"epoch:{epoch:03d}",
        )
        model.train()
        total_loss = 0.
        for sequence, label in progress_bar:
            sequence = sequence.to(device)
            label = label.to(device)

            optimizer.zero_grad()
            pred = model(sequence)
            # CrossEntropyLoss expects the class dimension at index 1.
            loss = loss_fn(pred.permute(0, 2, 1), label)
            loss.backward()
            optimizer.step()

            batch_loss = loss.item()
            progress_bar.set_postfix(loss=batch_loss)
            total_loss += batch_loss
        avg_loss = total_loss / len(train_dataloader)

        # Validation pass.
        valid_f1 = _mean_validation_f1(model, valid_dataloader, device)
        print(f"avg_training_loss: {avg_loss}, f1_score: {valid_f1}")

        # Save the weights after this epoch; the same file is overwritten
        # every epoch.
        save_path = "model.pkl"
        torch.save(model.state_dict(), save_path)
        print(f"Model saved to {save_path}")
http://www.dtcms.com/wzjs/437231.html

相关文章:

  • 便宜做网站的公司靠谱吗企业网站建设方案书
  • 独立网站如何做推广广州企业网站推广
  • 网站舆情监控怎么做网站统计系统
  • 青岛优化网站诊断搜索引擎优化期末考试答案
  • 伪装学渣无极网站seo外链推广
  • 神华科技 网站建设seo优化案例
  • 动态网站如何做软文推广的好处
  • 网站h1标签怎么做bt最佳磁力搜索引擎吧
  • 网站精准ip接口怎么做cfa一级看多久两分钟
  • ps企业网站模板免费下载离我最近的广告公司
  • 盱眙有做网站开发的吗常州网站seo
  • php动态网站开发案例教程pdf广州从化发布
  • 临沂网站建设有哪些百度提交网址
  • wordpress iconfontseo优化 搜 盈seo公司
  • 作网站公司发软文是什么意思
  • 做淘宝要用的网站吗sem和seo
  • 徐州 网站建设企业网站seo多少钱
  • 快云助手网站建设视频教程外链网盘源码
  • 梅州站扩建信息发布网站有哪些
  • 网页设计赚钱吗深圳seo培训
  • 广东省网站备案seo实战培训
  • 用代码做一号店网站怎么做安卓手机优化神器
  • 小程序收录wordpress主题杭州seo培训
  • 湖南智能网站建设报价英文外链平台
  • 做ptt有什么好的模板网站3d建模培训学校哪家好
  • 网页制作与网站建设实战大全 光盘接外包项目的网站
  • 郑州网站定制app推广一手单
  • 网站 国外服务器b2b采购平台
  • 代办网站企业备案广告投放平台排名
  • 深圳网站建设开发今日时政新闻