{"id":538,"date":"2023-01-16T10:34:12","date_gmt":"2023-01-16T02:34:12","guid":{"rendered":"https:\/\/scutvk.cn\/?p=538"},"modified":"2023-01-16T16:50:12","modified_gmt":"2023-01-16T08:50:12","slug":"document-level-argument-extraction-by-conditional-generation-%e5%a4%8d%e7%8e%b0","status":"publish","type":"post","link":"https:\/\/scutvk.cn\/?p=538","title":{"rendered":"Document-Level Argument Extraction by Conditional Generation \u590d\u73b0"},"content":{"rendered":"\n<p>\u5df2\u6dfb\u52a0OneIE\u5904\u7406\u540eACE2005\u6570\u636e\u96c6\u7684\u4ed3\u5e93\uff1a<a href=\"https:\/\/github.com\/vkgo\/gen-arg\" target=\"_blank\" rel=\"noopener\">vkgo\/gen-arg: Code for paper &#8220;Document-Level Argument Extraction by Conditional Generation&#8221;. NAACL 21&#8242; (github.com)<\/a><\/p>\n\n\n\n<p style=\"font-size:24px\"><strong>1 \u73af\u5883\u914d\u7f6e<\/strong><\/p>\n\n\n\n<p>\u6309\u8981\u6c42README\u914d\u7f6e\u597d<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img decoding=\"async\" loading=\"lazy\" width=\"314\" height=\"172\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image.png\" alt=\"\" class=\"wp-image-539\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image.png 314w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-300x164.png 300w\" sizes=\"(max-width: 314px) 100vw, 314px\" \/><\/figure>\n\n\n\n<p style=\"font-size:24px\"><strong>2 \u8fd0\u884c\u5c1d\u8bd5<\/strong><\/p>\n\n\n\n<p>\u5c1d\u8bd5\u6267\u884c<code>train.py<\/code><\/p>\n\n\n\n<pre class=\"wp-block-code\"><code lang=\"bash\" class=\"language-bash line-numbers\">python train.py --model gen --dataset ACE<\/code><\/pre>\n\n\n\n<p>\u62a5\u9519\uff0c\u7f3a\u53c2\u6570<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" loading=\"lazy\" width=\"1024\" height=\"368\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image-20230115100940664-1024x368.png\" alt=\"\" class=\"wp-image-540\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115100940664-1024x368.png 1024w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115100940664-300x108.png 300w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115100940664-768x276.png 768w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115100940664-769x276.png 769w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115100940664.png 1057w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<p>\u4ed4\u7ec6\u770b\u4e00\u904d\u4ed3\u5e93\u6587\u4ef6\u540e\uff0c\u53d1\u73b0\u6709\u73b0\u6210\u7684scripts\uff0cACE 2005 script\u5982\u4e0b\uff1a<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img decoding=\"async\" loading=\"lazy\" width=\"544\" height=\"463\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image-20230115101118874.png\" alt=\"\" class=\"wp-image-541\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115101118874.png 544w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115101118874-300x255.png 300w\" sizes=\"(max-width: 544px) 100vw, 544px\" \/><\/figure>\n\n\n\n<p>\u7ea2\u5708\u4e3a\u7f3a\u5c11\u7684\u6587\u4ef6\u3002<\/p>\n\n\n\n<p style=\"font-size:24px\"><strong>3 \u6570\u636e\u5904\u7406<\/strong><\/p>\n\n\n\n<p>\u901a\u8fc7\u4e0a\u8ff0\u7f3a\u5c11\u6587\u4ef6\u7684\u6587\u4ef6\u540d\u53ef\u4ee5\u731c\u6d4b\uff0c\u6570\u636e\u53ef\u80fd\u9700\u8981\u901a\u8fc7OneIE\u5904\u7406\u3002<\/p>\n\n\n\n<p>\u914d\u7f6e\u597dOneIE\u9879\u76ee\u540e\uff0c\u6267\u884c\u4ee5\u4e0b\u4ee3\u7801\u5904\u7406\u6570\u636e\uff1a<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code lang=\"bash\" class=\"language-bash line-numbers\">python preprocessing\/process_ace.py -i .\/data\/LDC2006T06\/data -o .\/data\/ACE2005-English-output -s resource\/splits\/ACE05-E -b bert-large-cased -l english<\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" loading=\"lazy\" width=\"1024\" height=\"106\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image-20230115103333948-1024x106.png\" alt=\"\" class=\"wp-image-542\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103333948-1024x106.png 1024w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103333948-300x31.png 300w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103333948-768x79.png 768w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103333948-1536x158.png 1536w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103333948-769x79.png 769w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103333948.png 1861w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<figure class=\"wp-block-image size-full\"><img decoding=\"async\" loading=\"lazy\" width=\"623\" height=\"168\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image-20230115103342475.png\" alt=\"\" class=\"wp-image-543\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103342475.png 623w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115103342475-300x81.png 300w\" sizes=\"(max-width: 623px) 100vw, 623px\" \/><\/figure>\n\n\n\n<p style=\"font-size:24px\"><strong>4 \u8fd0\u884c<\/strong><\/p>\n\n\n\n<p>\u6839\u636e\u5904\u7406\u540e\u7684\u6570\u636e\uff0c\u7b80\u5355\u4fee\u6539\u4e00\u4e0b\u8fd0\u884c\u547d\u4ee4\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code lang=\"bash\" class=\"language-bash line-numbers\">#!\/usr\/bin\/env bash\nset -e \nset -x \nDATA_DIR=.\/data\/ACE2005-English-oneie\nMODEL=constrained-gen\nCKPT_NAME=constrained-gen-ACE \n\n\nrm -rf checkpoints\/${CKPT_NAME}\npython train.py --model=${MODEL} --ckpt_name=${CKPT_NAME} \\\n    --dataset=ACE \\\n    --tmp_dir=preprocessed_ACE \\\n    --train_file=${DATA_DIR}\/train.oneie.json \\\n    --val_file=${DATA_DIR}\/dev.oneie.json \\\n    --test_file=${DATA_DIR}\/test.oneie.json \\\n    --train_batch_size=4 \\\n    --eval_batch_size=4 \\\n    --learning_rate=3e-5 \\\n    --accumulate_grad_batches=4 \\\n    --num_train_epochs=6 \\\n    --mark_trigger \n<\/code><\/pre>\n\n\n\n<p>Windows\u6ca1\u6709bash\uff0c\u4fee\u6539\u4e3a\uff1a<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code lang=\"bash\" class=\"language-bash line-numbers\">python train.py --model=constrained-gen --ckpt_name=constrained-gen-ACE --dataset=ACE --tmp_dir=preprocessed_ACE --train_file=.\/data\/ACE2005-English-oneie\/train.oneie.json --val_file=.\/data\/ACE2005-English-oneie\/dev.oneie.json --test_file=.\/data\/ACE2005-English-oneie\/test.oneie.json --train_batch_size=4 --eval_batch_size=4 --learning_rate=3e-5 --accumulate_grad_batches=4 --num_train_epochs=6 --mark_trigger<\/code><\/pre>\n\n\n\n<p>\u7b80\u5355debug\uff08\u5220\u9664\u4e4b\u524d\u5c1d\u8bd5\u7684\u65f6\u5019\u751f\u6210\u7684\u8bb8\u591a\u4e34\u65f6\u6587\u4ef6\u5939\u3001\u663e\u5b58\u4e0d\u8db3\u8c03\u4f4ebatchsize\uff09\uff0c\u6210\u529f\u8fd0\u884c\uff1a<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" loading=\"lazy\" width=\"1024\" height=\"144\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image-20230115104406190-1024x144.png\" alt=\"\" class=\"wp-image-544\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104406190-1024x144.png 1024w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104406190-300x42.png 300w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104406190-768x108.png 768w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104406190-1536x216.png 1536w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104406190-769x108.png 769w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104406190.png 1864w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<figure class=\"wp-block-image size-full\"><img decoding=\"async\" loading=\"lazy\" width=\"963\" height=\"549\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image-20230115104647405.png\" alt=\"\" class=\"wp-image-545\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104647405.png 963w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104647405-300x171.png 300w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104647405-768x438.png 768w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115104647405-769x438.png 769w\" sizes=\"(max-width: 963px) 100vw, 963px\" \/><\/figure>\n\n\n\n<p>\u6210\u529f\u8dd1\u5b8c1\u4e2aepoch<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" loading=\"lazy\" width=\"1024\" height=\"226\" src=\"https:\/\/x2.mday.top\/wp-content\/uploads\/2023\/01\/image-20230115105355722-1024x226.png\" alt=\"\" class=\"wp-image-546\" srcset=\"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115105355722-1024x226.png 1024w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115105355722-300x66.png 300w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115105355722-768x170.png 768w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115105355722-1536x339.png 1536w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115105355722-769x170.png 769w, https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115105355722.png 1871w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<p><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u5df2\u6dfb\u52a0OneIE\u5904\u7406\u540eACE2005\u6570\u636e\u96c6\u7684\u4ed3\u5e93\uff1a&hellip;<\/p>\n","protected":false},"author":1,"featured_media":546,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"jetpack_publicize_message":"","jetpack_is_tweetstorm":false,"jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":false,"jetpack_social_options":{"image_generator_settings":{"template":"highway","enabled":false}}},"categories":[10,12,2,3],"tags":[],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"https:\/\/scutvk.cn\/wp-content\/uploads\/2023\/01\/image-20230115105355722.png","_links":{"self":[{"href":"https:\/\/scutvk.cn\/index.php?rest_route=\/wp\/v2\/posts\/538"}],"collection":[{"href":"https:\/\/scutvk.cn\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/scutvk.cn\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/scutvk.cn\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/scutvk.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=538"}],"version-history":[{"count":2,"href":"https:\/\/scutvk.cn\/index.php?rest_route=\/wp\/v2\/posts\/538\/revisions"}],"predecessor-version":[{"id":557,"href":"https:\/\/scutvk.cn\/index.php?rest_route=\/wp\/v2\/posts\/538\/revisions\/557"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/scutvk.cn\/index.php?rest_route=\/wp\/v2\/media\/546"}],"wp:attachment":[{"href":"https:\/\/scutvk.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=538"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/scutvk.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=538"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/scutvk.cn\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=538"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}