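"""
submit.py

Inference script for the MEGNet-style scalar-coupling models. Loads a trained
checkpoint ('model1' -> MegnetModel1, 'model2' -> MegnetModel2), runs it over
the test set (or, in the debug branch, a validation split), and writes a
submission CSV with columns [id, scalar_coupling_constant] to
<out_dir>/submit/sub.csv.
"""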
import os
os.environ['CUDA_VISIBLE_DEVICES'] = '0'  # pin to the first GPU before any CUDA import

import argparse

from common import *
from model import *
from data.dataset import *
from data.dataset import _collate_fn
from data.data import *
from train_old import *

def run_submit(out_dir, model, checkpoint):
    model_dict = {
        'model1': MegnetModel1,
        'model2': MegnetModel2,
    }
    csv_file = out_dir + '/submit/sub.csv'

    ## setup -----------------------------------------------------------------------------
    os.makedirs(out_dir + '/checkpoint', exist_ok=True)
    os.makedirs(out_dir + '/submit', exist_ok=True)
    os.makedirs(out_dir + '/backup', exist_ok=True)
    # backup_project_as_zip(PROJECT_PATH, out_dir + '/backup/code.submit.%s.zip' % IDENTIFIER)

    log = Logger()
    log.open(out_dir + '/log.submit.txt', mode='a')
    log.write('\n--- [START %s] %s\n\n' % (IDENTIFIER, '-' * 64))
    log.write('\t%s\n' % COMMON_STRING)
    log.write('\n')
    ## dataset ----------------------------------------
    log.write('** dataset setting **\n')
    batch_size = 64

    if 0:  # <debug> score the validation split instead of the test set
        test_dataset = MolecularGraphDataset(
            mode  = 'train',
            csv   = 'train',
            # split='debug_split_by_mol.1000.npy',
            split = 'valid_split_by_mol.5000.npy',
            augment = None,
        )
    # ------------
    if 1:
        test_dataset = MolecularGraphDataset(
            mode  = 'test',
            csv   = 'test',
            # split='debug_split_by_mol.1000.npy',
            split = None,
            augment = None,
        )

    # SequentialSampler + drop_last=False keep every test row, in order,
    # so the predictions line up with the ids collected from `infor`.
    test_loader = DataLoader(
        test_dataset,
        sampler     = SequentialSampler(test_dataset),
        # sampler   = RandomSampler(train_dataset),
        batch_size  = batch_size,
        drop_last   = False,
        num_workers = 0,
        pin_memory  = True,
        collate_fn  = _collate_fn,
    )

    log.write('batch_size = %d\n' % batch_size)
    log.write('test_dataset : \n%s\n' % test_dataset)
    log.write('\n')
    ## net ----------------------------------------
    log.write('** net setting **\n')
    net = model_dict[model]().cuda()

    log.write('\tinitial_checkpoint = %s\n' % checkpoint)
    # load weights onto the CPU first, then copy them into the GPU-resident model
    net.load_state_dict(torch.load(checkpoint, map_location=lambda storage, loc: storage))

    log.write('%s\n' % type(net))
    log.write('\n')
    ## start testing here! ##############################################
    test_num = 0
    test_predict = []
    test_coupling_type = []
    test_coupling_value = []
    test_id = []
    test_loss = 0

    net.eval()
    start = timer()
    for [node, edge, state, index1, index2, gnode, gbond, coupling_index, infor], coupling_value in test_loader:
        with torch.no_grad():
            node = node.cuda()
            edge = edge.cuda()
            state = state.cuda()
            index1 = index1.cuda()
            index2 = index2.cuda()
            gnode = gnode.cuda()
            gbond = gbond.cuda()
            coupling_value = coupling_value.cuda()
            coupling_index = coupling_index.cuda()

            predict = net(node, edge, state, index1, index2, gnode, gbond, coupling_index)
            loss = criterion(predict, coupling_value)  # criterion is imported from train_old

        # ---
        num_batch = len(infor)  # number of molecules in this batch
        test_id.extend(list(np.concatenate([infor[i] for i in range(num_batch)])))
        test_predict.append(predict.data.cpu().numpy())
        test_coupling_type.append(coupling_index[:, 2].data.cpu().numpy())
        test_coupling_value.append(coupling_value.data.cpu().numpy())
        test_loss += loss.item() * num_batch
        test_num += num_batch

        print('\r %8d/%8d %0.2f %s' % (
            test_num, len(test_dataset), test_num / len(test_dataset),
            time_to_str(timer() - start, 'min')), end='', flush=True)

        pass  # -- end of one data loader --
    assert test_num == len(test_dataset)
    print('\n')
    ids = test_id
    predict = np.concatenate(test_predict)

    if test_dataset.mode == 'test':
        df = pd.DataFrame(list(zip(ids, predict)), columns=['id', 'scalar_coupling_constant'])
        df.to_csv(csv_file, index=False)
        log.write('id      = %d\n' % len(ids))
        log.write('predict = %d\n' % len(predict))
        log.write('csv_file = %s\n' % csv_file)

    # -------------------------------------------------------------
    # for debug: when scoring the validation split, report the kaggle metric
    if test_dataset.mode == 'train':
        test_loss = test_loss / test_num
        coupling_value = np.concatenate(test_coupling_value)
        coupling_type = np.concatenate(test_coupling_type).astype(np.int32)
        mae, log_mae = compute_kaggle_metric(predict, coupling_value, coupling_type)

        for t in range(NUM_COUPLING_TYPE):
            log.write('\tcoupling_type = %s\n' % COUPLING_TYPE[t])
            log.write('\tmae           = %f\n' % mae[t])
            log.write('\tlog_mae       = %+f\n' % log_mae[t])
            log.write('\n')
        log.write('\n')

        log.write('-- final -------------\n')
        log.write('\ttest_loss = %+f\n' % test_loss)
        log.write('\tmae       = %f\n' % np.mean(mae))
        log.write('\tlog_mae   = %+f\n' % np.mean(log_mae))
        log.write('\n')

# main #################################################################
if __name__ == '__main__':
    print('%s: calling main function ... ' % os.path.basename(__file__))

    parser = argparse.ArgumentParser()
    parser.add_argument('--out_dir', help='where to store the prediction file')
    parser.add_argument('--model', help='model to predict with: model1 or model2')
    parser.add_argument('--checkpoint', help='checkpoint to make predictions from')
    opt = parser.parse_args()

    run_submit(opt.out_dir, opt.model, opt.checkpoint)
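
# Example invocation (paths are illustrative placeholders, not this repo's
# actual directory layout):
#
#   python submit.py --out_dir ./results/model1 \
#                    --model model1 \
#                    --checkpoint ./results/model1/checkpoint/some_model.pth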