diff --git a/tutorials/classification/bert.ipynb b/tutorials/classification/bert.ipynb index b1ccef7..ccb7a11 100644 --- a/tutorials/classification/bert.ipynb +++ b/tutorials/classification/bert.ipynb @@ -67,11 +67,15 @@ "source": [ "trainset = mz.dataloader.Dataset(\n", " data_pack=train_pack_processed,\n", - " mode='point'\n", + " mode='point',\n", + " batch_size=20,\n", + " sort=False\n", ")\n", "testset = mz.dataloader.Dataset(\n", " data_pack=test_pack_processed,\n", - " mode='point'\n", + " mode='point',\n", + " batch_size=20,\n", + " sort=False\n", ")" ] }, @@ -84,16 +88,12 @@ "padding_callback = mz.models.Bert.get_default_padding_callback()\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", - " sort=False,\n", " callback=padding_callback\n", ")" ] @@ -713,8 +713,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.8" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/classification/esim.ipynb b/tutorials/classification/esim.ipynb index 34d9d54..026fd5f 100644 --- a/tutorials/classification/esim.ipynb +++ b/tutorials/classification/esim.ipynb @@ -169,11 +169,15 @@ "source": [ "trainset = mz.dataloader.Dataset(\n", " data_pack=train_pack_processed,\n", - " mode='point'\n", + " mode='point',\n", + " batch_size=40,\n", + " sort=False\n", ")\n", "devset = mz.dataloader.Dataset(\n", " data_pack=dev_pack_processed,\n", - " mode='point'\n", + " mode='point',\n", + " batch_size=40,\n", + " sort=False\n", ")" ] }, @@ -187,16 +191,12 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=40,\n", " stage='train',\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "devloader = mz.dataloader.DataLoader(\n", " dataset=devset,\n", - " batch_size=40,\n", " stage='dev',\n", - " sort=False,\n", " callback=padding_callback\n", ")" ] @@ -418,8 +418,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.7.3" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/anmm.ipynb b/tutorials/ranking/anmm.ipynb index faa7ae2..8ba8acc 100644 --- a/tutorials/ranking/anmm.ipynb +++ b/tutorials/ranking/anmm.ipynb @@ -136,10 +136,17 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=2,\n", - " num_neg=1\n", + " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False,\n", + " shuffle=True\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20,\n", + " sort=False,\n", + " shuffle=False\n", ")" ] }, @@ -153,19 +160,12 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", - " shuffle=True,\n", " callback=padding_callback,\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", - " sort=False,\n", - " shuffle=False,\n", " callback=padding_callback,\n", ")" ] @@ -604,8 +604,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.7.4" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/arci.ipynb b/tutorials/ranking/arci.ipynb index e963fe4..ae184e0 100644 --- a/tutorials/ranking/arci.ipynb +++ b/tutorials/ranking/arci.ipynb @@ -145,10 +145,14 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=2,\n", - " num_neg=1\n", + " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20\n", ")" ] }, @@ -167,15 +171,11 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -584,8 +584,17 @@ "_Feature" ], "window_display": false + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 4 -} +} \ No newline at end of file diff --git a/tutorials/ranking/arcii.ipynb b/tutorials/ranking/arcii.ipynb index 3ca51f5..7f83dae 100644 --- a/tutorials/ranking/arcii.ipynb +++ b/tutorials/ranking/arcii.ipynb @@ -145,10 +145,14 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=2,\n", - " num_neg=1\n", + " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20\n", ")" ] }, @@ -167,15 +171,11 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -575,8 +575,17 @@ "_Feature" ], "window_display": false + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 4 -} +} \ No newline at end of file diff --git a/tutorials/ranking/bert.ipynb b/tutorials/ranking/bert.ipynb index 51a4b10..8237048 100644 --- a/tutorials/ranking/bert.ipynb +++ b/tutorials/ranking/bert.ipynb @@ -69,10 +69,14 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=2,\n", - " num_neg=1\n", + " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20\n", ")" ] }, @@ -85,15 +89,11 @@ "padding_callback = mz.models.Bert.get_default_padding_callback()\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -711,8 +711,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.8" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/cdssm.ipynb b/tutorials/ranking/cdssm.ipynb index ad278d2..778d9cb 100644 --- a/tutorials/ranking/cdssm.ipynb +++ b/tutorials/ranking/cdssm.ipynb @@ -121,10 +121,15 @@ " mode='pair',\n", " num_dup=2,\n", " num_neg=1,\n", + " batch_size=20,\n", + " sort=False,\n", + " resample=True,\n", " callbacks=[triletter_callback]\n", ")\n", "testset = mz.dataloader.Dataset(\n", " data_pack=test_pack_processed,\n", + " batch_size=20,\n", + " sort=False,\n", " callbacks=[triletter_callback]\n", ")" ] @@ -142,17 +147,12 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " sort=False,\n", - " resample=True,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", - " sort=False,\n", " callback=padding_callback\n", ")" ] @@ -508,8 +508,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.9" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/conv_knrm.ipynb b/tutorials/ranking/conv_knrm.ipynb index 3a6d364..e9fe31b 100644 --- a/tutorials/ranking/conv_knrm.ipynb +++ b/tutorials/ranking/conv_knrm.ipynb @@ -148,10 +148,14 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=5,\n", - " num_neg=1\n", + " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20\n", ")" ] }, @@ -165,15 +169,11 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -597,8 +597,17 @@ "_Feature" ], "window_display": false + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 4 -} +} \ No newline at end of file diff --git a/tutorials/ranking/drmm.ipynb b/tutorials/ranking/drmm.ipynb index cbe2d7c..ee99ac3 100644 --- a/tutorials/ranking/drmm.ipynb +++ b/tutorials/ranking/drmm.ipynb @@ -147,10 +147,13 @@ " mode='pair',\n", " num_dup=5,\n", " num_neg=10,\n", + " batch_size=20,\n", + " resample=True,\n", " callbacks=[histgram_callback]\n", ")\n", "testset = mz.dataloader.Dataset(\n", " data_pack=test_pack_processed,\n", + " batch_size=20,\n", " callbacks=[histgram_callback]\n", ")" ] @@ -166,14 +169,11 @@ "trainloader = mz.dataloader.DataLoader(\n", " device='cpu',\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -507,8 +507,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.9" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/dssm.ipynb b/tutorials/ranking/dssm.ipynb index 270d68f..fc6b247 100644 --- a/tutorials/ranking/dssm.ipynb +++ b/tutorials/ranking/dssm.ipynb @@ -127,10 +127,13 @@ " mode='pair',\n", " num_dup=1,\n", " num_neg=4,\n", + " batch_size=32,\n", + " resample=True,\n", " callbacks=[triletter_callback]\n", ")\n", "testset = mz.dataloader.Dataset(\n", " data_pack=test_pack_processed,\n", + " batch_size=32,\n", " callbacks=[triletter_callback]\n", ")" ] @@ -145,14 +148,11 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=32,\n", " stage='train',\n", - " resample=True,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=32,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -501,8 +501,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.9" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/duet.ipynb b/tutorials/ranking/duet.ipynb index bc64ad6..e916750 100644 --- a/tutorials/ranking/duet.ipynb +++ b/tutorials/ranking/duet.ipynb @@ -163,10 +163,14 @@ " mode='pair',\n", " num_dup=2,\n", " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False,\n", " callbacks=[triletter_callback]\n", ")\n", "testset = mz.dataloader.Dataset(\n", " data_pack=test_pack_processed,\n", + " batch_size=20,\n", " callbacks=[triletter_callback]\n", ")" ] @@ -187,15 +191,11 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -435,8 +435,17 @@ "_Feature" ], "window_display": false + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 4 -} +} \ No newline at end of file diff --git a/tutorials/ranking/esim.ipynb b/tutorials/ranking/esim.ipynb index 65efe61..b64f327 100644 --- a/tutorials/ranking/esim.ipynb +++ b/tutorials/ranking/esim.ipynb @@ -146,10 +146,17 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=5,\n", - " num_neg=10\n", + " num_neg=10,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False,\n", + " shuffle=True\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20,\n", + " sort=False,\n", + " shuffle=False\n", ")" ] }, @@ -163,19 +170,12 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", - " shuffle=True,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", - " sort=False,\n", - " shuffle=False,\n", " callback=padding_callback\n", ")" ] @@ -514,8 +514,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.8" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/knrm.ipynb b/tutorials/ranking/knrm.ipynb index 9dcd089..d6c9499 100644 --- a/tutorials/ranking/knrm.ipynb +++ b/tutorials/ranking/knrm.ipynb @@ -152,10 +152,14 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=5,\n", - " num_neg=1\n", + " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20,\n", ")" ] }, @@ -169,15 +173,11 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -570,8 +570,17 @@ "_Feature" ], "window_display": false + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 4 -} +} \ No newline at end of file diff --git a/tutorials/ranking/match_srnn.ipynb b/tutorials/ranking/match_srnn.ipynb index c391696..dd9b691 100644 --- a/tutorials/ranking/match_srnn.ipynb +++ b/tutorials/ranking/match_srnn.ipynb @@ -155,10 +155,14 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=2,\n", - " num_neg=1\n", + " num_neg=1,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20,\n", ")" ] }, @@ -177,15 +181,11 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", " callback=padding_callback\n", ")" @@ -532,8 +532,17 @@ "name": "python", "npconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": 3 + "version": 3, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } + } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file diff --git a/tutorials/ranking/matchlstm.ipynb b/tutorials/ranking/matchlstm.ipynb index 4a952ff..edf8737 100644 --- a/tutorials/ranking/matchlstm.ipynb +++ b/tutorials/ranking/matchlstm.ipynb @@ -146,10 +146,17 @@ " data_pack=train_pack_processed,\n", " mode='pair',\n", " num_dup=5,\n", - " num_neg=10\n", + " num_neg=10,\n", + " batch_size=20,\n", + " resample=True,\n", + " sort=False,\n", + " shuffle=True\n", ")\n", "testset = mz.dataloader.Dataset(\n", - " data_pack=test_pack_processed\n", + " data_pack=test_pack_processed,\n", + " batch_size=20,\n", + " sort=False,\n", + " shuffle=False\n", ")" ] }, @@ -163,19 +170,12 @@ "\n", "trainloader = mz.dataloader.DataLoader(\n", " dataset=trainset,\n", - " batch_size=20,\n", " stage='train',\n", - " resample=True,\n", - " sort=False,\n", - " shuffle=True,\n", " callback=padding_callback\n", ")\n", "testloader = mz.dataloader.DataLoader(\n", " dataset=testset,\n", - " batch_size=20,\n", " stage='dev',\n", - " sort=False,\n", - " shuffle=False,\n", " callback=padding_callback\n", ")" ] @@ -508,8 +508,17 @@ "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.8" + }, + "pycharm": { + "stem_cell": { + "cell_type": "raw", + "source": [], + "metadata": { + "collapsed": false + } + } } }, "nbformat": 4, "nbformat_minor": 2 -} +} \ No newline at end of file