<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
  xmlns:xhtml="http://www.w3.org/1999/xhtml">
  <url>
    <loc>https://sino-huang.github.io/research-idea/neuro-symbolic-instruction-following-normal/literature-on-nl-granularity/</loc>
    <lastmod>2025-09-01T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/nsai-multi-agent-communiation/</loc>
    <lastmod>2025-06-29T16:04:23+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/neuro-symbolic-instruction-following-normal/</loc>
    <lastmod>2025-06-29T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/neuro-symbolic-instruction-following-normal/behavior-aware-balancing/</loc>
    <lastmod>2025-06-29T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/neuro-symbolic-instruction-following-normal/generalization-ability/</loc>
    <lastmod>2025-06-29T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/neuro-symbolic-instruction-following-normal/incremental_progress_proposal/</loc>
    <lastmod>2025-06-29T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/neuro-symbolic-instruction-following-normal/pragmatic-feature-selection/</loc>
    <lastmod>2025-06-29T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/neuro-symbolic-instruction-following-normal/vla-monitor-technique/</loc>
    <lastmod>2025-06-29T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/awesome-ideas/language-abstraction/</loc>
    <lastmod>2025-06-27T22:49:29+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/awesome-ideas/</loc>
    <lastmod>2025-06-07T22:49:29+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/awesome-ideas/literature-review-gen/</loc>
    <lastmod>2025-06-07T22:49:29+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/awesome-ideas/vllm-vs-vla/</loc>
    <lastmod>2025-06-07T22:49:29+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/</loc>
    <lastmod>2025-09-01T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/research-idea/</loc>
    <lastmod>2025-09-01T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/research-idea/</loc>
    <lastmod>2025-09-01T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/</loc>
    <lastmod>2025-09-01T16:04:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/concept-erase/</loc>
    <lastmod>2025-04-02T17:17:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/null-space/</loc>
    <lastmod>2025-04-02T17:17:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/paper-review/</loc>
    <lastmod>2025-04-02T17:17:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/</loc>
    <lastmod>2025-04-02T17:17:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/svd_speed_concept_erasing_2025/</loc>
    <lastmod>2025-04-02T17:17:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/svd/</loc>
    <lastmod>2025-04-02T17:17:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/</loc>
    <lastmod>2025-04-02T17:17:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/awesome_life_long_rl_2025/</loc>
    <lastmod>2025-03-16T23:03:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/forgetting-of-pre-trained-capabilities/</loc>
    <lastmod>2025-03-16T23:03:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/lifelong-rl/</loc>
    <lastmod>2025-03-16T23:03:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/multi-task-rl/</loc>
    <lastmod>2025-03-16T23:03:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/paper-review-collection/</loc>
    <lastmod>2025-03-16T23:03:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/awesome_llm_and_diff_abst_of_language_info_2025/</loc>
    <lastmod>2025-03-16T22:17:16+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/level-of-abstraction-of-language-instruction/</loc>
    <lastmod>2025-03-16T22:17:16+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llms-as-modelers/</loc>
    <lastmod>2025-03-13T10:19:40+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llms-as-planners/</loc>
    <lastmod>2025-03-13T10:19:40+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llms-for-planning/</loc>
    <lastmod>2025-03-13T10:19:40+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/survey_of_llm_for_planning_2025/</loc>
    <lastmod>2025-03-13T10:19:40+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/htn-planning/</loc>
    <lastmod>2025-03-05T09:44:58+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/htn_planning_by_pascal_2025/</loc>
    <lastmod>2025-03-05T09:44:58+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/knowledge-representation/</loc>
    <lastmod>2025-03-04T12:07:13+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/learning_general_policy_by_hector_2025/</loc>
    <lastmod>2025-03-04T12:07:13+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/sketch/</loc>
    <lastmod>2025-03-04T12:07:13+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/shenan-model-based-rpgm-2023/</loc>
    <lastmod>2025-03-02T23:24:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/rp-pgms/</loc>
    <lastmod>2025-03-02T23:24:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-as-policy-model-in-online-rl-setting/</loc>
    <lastmod>2025-03-01T21:49:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/paper-collection-review/</loc>
    <lastmod>2025-03-01T21:49:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/awesome_llm_for_embodied_rl_and_decision_making_by_2025/</loc>
    <lastmod>2025-03-01T21:49:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/neuro_symbolic_works_from_hamid_2024_2025/</loc>
    <lastmod>2025-02-26T12:53:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/neuro-symbolic/</loc>
    <lastmod>2025-02-26T12:53:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/awesome_llm_reasoning_capability_papers/</loc>
    <lastmod>2025-02-09T21:07:11+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-reasoning/</loc>
    <lastmod>2025-02-09T21:07:11+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-and-pddl/</loc>
    <lastmod>2024-12-24T22:25:58+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-planner/</loc>
    <lastmod>2024-12-24T22:25:58+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/pallagani-plansformer-generating-plans-2023/</loc>
    <lastmod>2024-12-24T22:25:58+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/damai-dai-deepseekmoe-2024/</loc>
    <lastmod>2024-06-22T11:13:50+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm/</loc>
    <lastmod>2024-06-22T11:13:50+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/mixture-of-experts/</loc>
    <lastmod>2024-06-22T11:13:50+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jessy-lin-learning-to-model-the-world-with-language-2024/</loc>
    <lastmod>2024-06-21T11:47:25+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-rl/</loc>
    <lastmod>2024-06-21T11:47:25+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/world-model/</loc>
    <lastmod>2024-06-21T11:47:25+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-verification/</loc>
    <lastmod>2024-06-20T20:19:12+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/topic-review/</loc>
    <lastmod>2024-06-20T20:19:12+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/verification-in-llm-topic-2024/</loc>
    <lastmod>2024-06-20T20:19:12+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jiuzhou-reward-engineering-for-generating-semi-structured-explan-2023/</loc>
    <lastmod>2024-06-20T14:11:32+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/reward-model/</loc>
    <lastmod>2024-06-20T14:11:32+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jiuzhou-towards-uncertaintty-aware-lang-agent-2024/</loc>
    <lastmod>2024-06-20T11:15:18+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/language-agent/</loc>
    <lastmod>2024-06-20T11:15:18+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/uncertainty-handling/</loc>
    <lastmod>2024-06-20T11:15:18+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/noisy-reward/</loc>
    <lastmod>2024-05-10T22:23:31+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/rl-reward/</loc>
    <lastmod>2024-05-10T22:23:31+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/silviu-pitis-failure-modes-of-learning-reward-models-for-sequence-model-2023/</loc>
    <lastmod>2024-05-10T22:23:31+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/gaurav-ghosal-the-effect-of-modeling-human-rationality-level-2023/</loc>
    <lastmod>2024-05-10T19:35:03+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/nate-rahn-policy-optimization-in-noisy-neighbourhood-2023/</loc>
    <lastmod>2024-05-10T14:16:56+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ademi-adeniji-language-reward-modulation-for-pretraining-rl-2023/</loc>
    <lastmod>2024-05-09T21:18:00+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/thomas-coste-reward-model-ensembles-help-mitigate-overoptimization-2024/</loc>
    <lastmod>2024-05-09T14:06:33+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/mengdi-li-internally-rewarded-rl-2023/</loc>
    <lastmod>2024-05-08T14:59:15+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xuran-pan-on-the-integration-of-self-attention-and-convolution-2022/</loc>
    <lastmod>2024-04-25T17:53:46+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/recent-language-model-technique-2024/</loc>
    <lastmod>2024-04-25T12:49:03+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/revision/</loc>
    <lastmod>2024-04-25T12:49:03+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-policy/</loc>
    <lastmod>2024-04-23T13:20:22+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/thomas-carta-grounding-llms-in-rl-2023/</loc>
    <lastmod>2024-04-23T13:20:22+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/daniel-hierarchies-of-reward-machines-2023/</loc>
    <lastmod>2024-04-12T15:12:54+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/intrinsic-reward/</loc>
    <lastmod>2024-04-12T15:12:54+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/shanchuan-efficient-n-robust-exploration-through-discriminative-ir-2023/</loc>
    <lastmod>2024-04-12T15:07:58+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/how-to-autostart-apps-on-your-server/</loc>
    <lastmod>2024-04-12T12:23:29+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/programming-notes/</loc>
    <lastmod>2024-04-12T12:23:29+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/</loc>
    <lastmod>2024-04-12T12:23:29+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/seungyong-discover-hierarchical-achieve-in-rl-via-cl-2023/</loc>
    <lastmod>2024-04-02T21:02:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/hierarchical-rl/</loc>
    <lastmod>2024-04-02T21:02:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/using-kedro-n-optuna-for-your-project/</loc>
    <lastmod>2024-03-27T21:50:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/chain-of-thought/</loc>
    <lastmod>2024-02-28T19:59:38+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/code-generation/</loc>
    <lastmod>2024-02-28T19:59:38+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jia-li-structured-cot-prompting-for-code-generation-2023/</loc>
    <lastmod>2024-02-28T19:59:38+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/confidence-estimation/</loc>
    <lastmod>2024-02-28T16:12:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/stephanie-teaching-models-to-express-their-uncertainty-in-words-2022/</loc>
    <lastmod>2024-02-28T16:12:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/gwenyth-estimating-confidence-of-llm-by-prompt-agreement-2023/</loc>
    <lastmod>2024-02-27T15:44:06+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/sudhir-agarwal-translate-infer-compile-for-accurate-text-to-plan-2024/</loc>
    <lastmod>2024-02-17T12:56:25+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/how-to-design-your-research-project-structure/</loc>
    <lastmod>2024-02-02T19:50:31+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/ai-assistant/</loc>
    <lastmod>2024-01-30T23:17:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/philip-cohen-intention-is-choice-with-commitment-1990/</loc>
    <lastmod>2024-01-30T23:17:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/theory/</loc>
    <lastmod>2024-01-30T23:17:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/christian-muise-planning-for-goal-oriented-dialgue-systems-2019/</loc>
    <lastmod>2024-01-30T16:58:06+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/planning-for-dialogue-ai/</loc>
    <lastmod>2024-01-30T16:58:06+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/survey/</loc>
    <lastmod>2024-01-29T23:02:47+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/vishal-pallagani-llm-n-planning-survey-2024/</loc>
    <lastmod>2024-01-29T23:02:47+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ishika-singh-progprompt-program-generation-for-robot-task-planning-2023/</loc>
    <lastmod>2024-01-29T20:45:59+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/avichai-levy-understanding-natural-language-in-context-2023/</loc>
    <lastmod>2024-01-29T20:25:43+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-cot/</loc>
    <lastmod>2024-01-29T17:44:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-empirical-strategy/</loc>
    <lastmod>2024-01-29T17:44:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/mingyu-jin-the-impact-of-reasoning-steps-length-on-llm-2024/</loc>
    <lastmod>2024-01-29T17:44:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-weak-supervision/</loc>
    <lastmod>2024-01-29T15:32:21+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/collin-burns-weak-to-strong-generalisation-weak-supervision-2023/</loc>
    <lastmod>2024-01-29T15:32:21+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-hallucination/</loc>
    <lastmod>2024-01-28T23:11:28+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ziwei-xu-hallucination-is-inevitable-an-innate-limitation-llm-2024/</loc>
    <lastmod>2024-01-28T23:11:28+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/machine-translation-reward-model/</loc>
    <lastmod>2024-01-28T22:53:41+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/quality-estimation/</loc>
    <lastmod>2024-01-28T22:53:41+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/zhiwei-he-improving-machine-translation-use-quality-estimation-as-a-reward-model-2024/</loc>
    <lastmod>2024-01-28T22:53:41+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/krishan-rana-sayplan-grounding-llm-for-scalable-task-planning-2023/</loc>
    <lastmod>2024-01-28T21:37:21+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-planner-robotics/</loc>
    <lastmod>2024-01-28T21:37:21+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/robotics/</loc>
    <lastmod>2024-01-28T21:37:21+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/action-trajectory-constraints/</loc>
    <lastmod>2024-01-28T21:28:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/luigi-bonassi-planning-with-qualitative-constraints-pddl3-2022/</loc>
    <lastmod>2024-01-28T21:28:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/pddl3/</loc>
    <lastmod>2024-01-28T21:28:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/language-reward-shaping/</loc>
    <lastmod>2024-01-28T09:31:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/parsa-mahmoudieh-zero-shot-reward-specification-via-grounded-natural-language-2022/</loc>
    <lastmod>2024-01-28T09:31:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/robotic-arm/</loc>
    <lastmod>2024-01-28T09:31:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/allen-z-ren-robots-that-ask-for-help-uncertainty-alignment-2023/</loc>
    <lastmod>2024-01-26T17:29:29+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/future-work/</loc>
    <lastmod>2024-01-26T17:29:29+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/language-ambiguity/</loc>
    <lastmod>2024-01-26T17:29:29+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/uncertainty-estimation/</loc>
    <lastmod>2024-01-26T17:29:29+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-agent/</loc>
    <lastmod>2024-01-25T00:55:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/llm-for-reward-function/</loc>
    <lastmod>2024-01-25T00:55:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/lm-for-uncertainty/</loc>
    <lastmod>2024-01-25T00:55:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/marta-skreta-replan-robotic-replanning-2024/</loc>
    <lastmod>2024-01-25T00:55:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/binghai-wang-secrets-of-rlhf-reward-modelling-2024/</loc>
    <lastmod>2024-01-24T23:31:28+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/rui-zheng-secrets-of-rlhf-in-llm-part-ppo-2023/</loc>
    <lastmod>2024-01-22T20:26:18+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/zhiting-hu-language-agent-and-world-models-2023/</loc>
    <lastmod>2024-01-22T16:01:20+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/react-js-development-2024/</loc>
    <lastmod>2024-01-21T17:40:43+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/gautier-dagan-dynamic-planning-with-a-llm-2023/</loc>
    <lastmod>2024-01-21T01:42:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/instruction-following-robotics-with-pddl/</loc>
    <lastmod>2024-01-21T00:34:56+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jun-wang-conformal-temporal-logic-planning-using-llm-2023/</loc>
    <lastmod>2024-01-21T00:34:56+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/ltl/</loc>
    <lastmod>2024-01-21T00:34:56+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/training-environment/</loc>
    <lastmod>2024-01-21T00:34:56+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/python-and-os-utils-2024/</loc>
    <lastmod>2024-01-18T18:51:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/gerevini-plan-constraints-and-preferences-in-pddl3-2005/</loc>
    <lastmod>2024-01-11T19:54:29+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/pddl/</loc>
    <lastmod>2024-01-11T19:54:29+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/nir-lipo-planning-with-perspectives-using-functional-strips-2022/</loc>
    <lastmod>2024-01-11T19:41:55+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/python-logger/</loc>
    <lastmod>2023-12-04T20:25:12+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alex_coulter-theory-alignment-via-a-classical-encoding-of-regular-bismulation-2022/</loc>
    <lastmod>2023-11-29T17:24:08+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/model-comparison/</loc>
    <lastmod>2023-11-29T17:24:08+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/pascal-bercher-detecting-ai-planning-modelling-mistakes-potential-errors-and-benchmark-domains-2023/</loc>
    <lastmod>2023-11-13T22:33:14+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/planning/</loc>
    <lastmod>2023-11-13T22:33:14+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/large-language-model/</loc>
    <lastmod>2023-10-27T16:44:22+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/reward-design/</loc>
    <lastmod>2023-10-27T16:44:22+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yecheng-jason-ma-eureka-human-level-reward-design-via-coding-large-language-models-2023/</loc>
    <lastmod>2023-10-27T16:44:22+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/mark-chen-evaluating-large-language-models-trained-on-code-2021/</loc>
    <lastmod>2023-10-16T07:24:26+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/baptiste-roziere-code-llama-open-foundation-model-for-code-2023/</loc>
    <lastmod>2023-10-16T02:58:20+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/haotian-liu-improved-baselines-with-visual-instruction-tuning-2023/</loc>
    <lastmod>2023-10-08T10:37:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/multimodal-learning/</loc>
    <lastmod>2023-10-08T10:37:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/christabel-wayllace-goal-recognition-design-with-stochastic-agent-action-outcomes-2016/</loc>
    <lastmod>2023-10-06T18:16:28+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alba-gragera-pddl-domain-repair-fixing-domains-with-incomplete-action-effects-2023/</loc>
    <lastmod>2023-09-20T23:17:51+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/pddl-repair/</loc>
    <lastmod>2023-09-20T23:17:51+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alba-gragera-exploring-the-limitations-of-using-llms-to-fix-planning-tasks-2023/</loc>
    <lastmod>2023-09-20T20:22:32+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/pddl-fixing/</loc>
    <lastmod>2023-09-20T20:22:32+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tathagata-chakraborti-plan-explanations-as-model-reconciliation-2017/</loc>
    <lastmod>2023-09-19T22:04:06+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/vishal-pallagani-plansformer-tool-demonstrating-generation-of-symbolic-plans-using-transformers-2023/</loc>
    <lastmod>2023-09-16T00:46:56+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/junnan_li-blip2-boostrapping-language-image-pretraining-2023/</loc>
    <lastmod>2023-08-28T18:48:08+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/multimodal/</loc>
    <lastmod>2023-08-28T18:48:08+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/peng_gao-llama-adapter-v2-2023/</loc>
    <lastmod>2023-08-28T18:47:05+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/langchain-use-cases-2023/</loc>
    <lastmod>2023-08-26T17:36:47+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/reward-machine/</loc>
    <lastmod>2023-08-17T16:32:09+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/rodrigo-reward-machines-exploiting-reward-function-structure-in-rl-2022/</loc>
    <lastmod>2023-08-17T16:32:09+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/rodrigo-using-reward-machines-for-high-level-task-specification-and-decomposition-in-rl-2018/</loc>
    <lastmod>2023-08-17T11:13:24+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/pytorch-multiprocessing-2023/</loc>
    <lastmod>2023-07-18T16:48:13+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/remote-server-and-tmux-2023/</loc>
    <lastmod>2023-07-16T18:45:57+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/william_berrios-towards-language-models-that-can-see-2023/</loc>
    <lastmod>2023-07-03T19:33:22+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/large-language-models/</loc>
    <lastmod>2023-07-02T21:24:50+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/lionel_wong-from-word-models-to-world-models-2023/</loc>
    <lastmod>2023-07-02T21:24:50+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jianning_wang-boosting-language-models-reasoning-with-chain-of-knowledge-prompting-2023/</loc>
    <lastmod>2023-07-02T16:09:58+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/prompting-design/</loc>
    <lastmod>2023-07-02T16:09:58+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/web-scrawler-using-selenium-2023/uc-use-case/</loc>
    <lastmod>2023-06-22T22:38:28+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/web-scrawler-using-selenium-2023/</loc>
    <lastmod>2023-06-22T22:38:28+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/web-scrawler-using-selenium-2023/xpath-cheatsheet/</loc>
    <lastmod>2023-06-22T22:38:28+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/lin_guan-leveraging-pretrained-llm-to-construct-and-utilise-world-models-for-model-based-task-planning-2023/</loc>
    <lastmod>2023-06-04T12:01:46+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/programming-notes/python-module-and-package-management-2023/</loc>
    <lastmod>2023-05-28T11:56:47+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/dharma_kc-neural-machine-translation-for-code-generation-2023/</loc>
    <lastmod>2023-05-28T09:52:32+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jiannan_xiang-language-models-meet-world-models-2023/</loc>
    <lastmod>2023-05-26T01:00:02+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/natural-language-reinforcement-learning/</loc>
    <lastmod>2023-05-26T01:00:02+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/generalised-planning/</loc>
    <lastmod>2023-05-24T19:57:16+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ryan_yang-pg3-policy-guided-planning-for-generalised-policy-generation-2022/</loc>
    <lastmod>2023-05-24T19:57:16+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/shunyu_yao-tree-of-thoughts-2023/</loc>
    <lastmod>2023-05-24T16:35:10+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tom_silver-generalised-planning-in-pddl-domains-with-pretrained-large-language-models-2023/</loc>
    <lastmod>2023-05-23T21:27:15+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yongliang-hugginggpt-2023/</loc>
    <lastmod>2023-05-23T11:57:02+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yaqi_xie-translating-natural-language-to-planning-goals-with-llm-2023/</loc>
    <lastmod>2023-05-22T12:30:25+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/bo_liu-llmp-empowering-large-language-models-with-optimal-planning-proficiency-2023/</loc>
    <lastmod>2023-05-22T11:56:15+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/siyu_yuan-distilling-script-knowledge-from-large-language-models-for-constrainted-language-planning-2023/</loc>
    <lastmod>2023-05-22T11:31:39+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/junnan_li-blip-bootstrapping-language-image-pre-training-for-unified-vision-language-understanding-and-generation-2022/</loc>
    <lastmod>2023-05-22T11:17:28+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/harsh_jhamtani-natural-language-decomposition-and-interpretation-of-complex-utterances-2023/</loc>
    <lastmod>2023-05-22T09:54:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/natural-language-understanding/</loc>
    <lastmod>2023-05-22T09:54:04+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alexander_kirillov-segment-anything-2023/</loc>
    <lastmod>2023-05-21T11:56:54+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/computer-vision/</loc>
    <lastmod>2023-05-21T11:56:54+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/rohit_gridhar-imagebind-one-embedding-space-to-bind-them-all-2023/</loc>
    <lastmod>2023-05-15T15:06:48+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/qinghao_hitea-hierarchical-temporal-aware-video-language-pre-training-2022/</loc>
    <lastmod>2023-04-06T10:02:22+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/video-captioning/</loc>
    <lastmod>2023-04-06T10:02:22+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/exploration-strategy/</loc>
    <lastmod>2023-04-05T10:02:24+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jacob_andreas-guiding-pretraining-in-reinforcement-learning-with-llms-2023/</loc>
    <lastmod>2023-04-05T10:02:24+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/language-reinforcement-learning/</loc>
    <lastmod>2023-04-05T10:02:24+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/language-model/</loc>
    <lastmod>2023-04-03T15:25:01+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/luke_zettlemoyer-scaling-expert-language-models-with-unsupervised-domain-discovery-2023/</loc>
    <lastmod>2023-04-03T15:25:01+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xuanting_chen-how-robust-is-gpt35-to-predecessors-a-comprehensive-study-on-language-understanding-tasks/</loc>
    <lastmod>2023-04-03T15:00:57+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/anthony_liu-a-picture-is-worth-a-thousand-words-language-models-plan-from-pixels-2023/</loc>
    <lastmod>2023-04-03T11:28:43+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/wenlong_huang-grounded-decoding-guiding-text-generation-with-grounded-models-for-robot-control-2023/</loc>
    <lastmod>2023-03-30T23:45:18+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/generative-models/</loc>
    <lastmod>2023-03-30T21:20:31+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/goal-conditioned-reinforcement-learning/</loc>
    <lastmod>2023-03-30T21:20:31+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/mariana_learning-generative-models-with-goal-conditioned-reinforcement-learning-2023/</loc>
    <lastmod>2023-03-30T21:20:31+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/hierarchical-reinforcement-learning/</loc>
    <lastmod>2023-03-30T15:01:16+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/itsugun_cho-deep-rl-with-hierarchical-action-exploration-for-dialogue-generation-2023/</loc>
    <lastmod>2023-03-30T15:01:16+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/instruction-following-agent/</loc>
    <lastmod>2023-03-15T21:09:32+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/reinforcement-learning/</loc>
    <lastmod>2023-03-15T21:09:32+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/theodore_r_sumers-how-to-talk-so-ai-will-learn-2022/</loc>
    <lastmod>2023-03-15T21:09:32+08:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/cheng_chi-diffusion-policy-visuomotor-policy-learning-via-action-diffusion-2023/</loc>
    <lastmod>2023-03-09T19:36:17+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/diffusion-model/</loc>
    <lastmod>2023-03-09T19:36:17+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alan_lindsay-framer-planning-models-from-natural-language-action-descriptions-2017/</loc>
    <lastmod>2023-03-09T19:28:47+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/open-world-reasoning/</loc>
    <lastmod>2023-03-09T19:28:47+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/siddharth_karamcheti-language-driven-representation-learning-for-robotics-2023/</loc>
    <lastmod>2023-03-03T16:16:19+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tatsuki_kuribayashi-does-vision-accelerate-hierarchical-generalisation-of-neural-language-learners-2023/</loc>
    <lastmod>2023-03-03T15:26:55+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jing_cheng_pang-natural-language-conditioned-reinforcement-learning-with-inside-out-task-language-development-and-translation-2023/</loc>
    <lastmod>2023-03-03T15:19:43+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/suvaansh_bhambri-multi-level-compositional-reasoning-for-interactive-instruction-following-2023/</loc>
    <lastmod>2023-03-03T11:17:01+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/hindsight-instruction-relabeling/</loc>
    <lastmod>2023-03-02T19:06:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tianjun_zhang-the-wisdom-of-hindsight-makes-language-models-better-instruction-followers-2023/</loc>
    <lastmod>2023-03-02T19:06:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ying_shen-learning-by-asking-for-embodied-visual-navigation-and-task-completion-2023/</loc>
    <lastmod>2023-03-02T17:51:02+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/commonsense-learning/</loc>
    <lastmod>2023-03-02T15:22:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ernest_davis-benchmarks-for-automated-commonsense-reasoning-a-survey-2023/</loc>
    <lastmod>2023-03-02T15:22:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alexander_nikulin-anti-exploration-by-random-network-distillation-2023/</loc>
    <lastmod>2023-03-01T22:14:11+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/offline-reinforcement-learning/</loc>
    <lastmod>2023-03-01T22:14:11+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/edoardo_cetin-learning-pessimism-for-reinforcement-learning-2023/</loc>
    <lastmod>2023-03-01T21:02:25+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/prompt-learning/</loc>
    <lastmod>2023-03-01T19:57:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/timo_schick-toolformer-language-models-can-teach-themselves-to-use-tools-2023/</loc>
    <lastmod>2023-03-01T19:57:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/almog_gueta-knowledge-is-a-region-in-weight-space-for-fine-tuned-language-model-2023/</loc>
    <lastmod>2023-03-01T12:45:54+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/fine-tuning/</loc>
    <lastmod>2023-03-01T12:45:54+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/multitask-learning/</loc>
    <lastmod>2023-03-01T12:45:54+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/contrastive-learning/</loc>
    <lastmod>2023-02-10T02:51:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/data-augmentation/</loc>
    <lastmod>2023-02-10T02:51:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xiwen_liang-contrastive-instruction-trajectory-learning-for-vision-language-navigation-2022/</loc>
    <lastmod>2023-02-10T02:51:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jacob_andreas-lammp-language-models-as-probabilistic-priors-for-perception-and-action-2023/</loc>
    <lastmod>2023-02-10T00:46:15+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/language-model-reasoning/</loc>
    <lastmod>2023-02-08T22:23:45+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/zhuosheng_zhang-multimodal-chain-of-thought-reasoning-in-language-models-2023/</loc>
    <lastmod>2023-02-08T22:23:45+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/siyuan_wang-unifying-structure-reasoning-and-language-model-pre-training-for-complex-reasoning-2023/</loc>
    <lastmod>2023-02-08T22:17:31+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ekin_akyurek-towards-tracing-factual-knowledge-in-language-models-back-to-the-training-data-2022/</loc>
    <lastmod>2023-02-08T22:16:28+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/danijar_hafner-mastering-diverse-domains-through-world-models-2023/</loc>
    <lastmod>2023-02-07T18:18:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yuanhan_zhang-what-makes-good-examples-for-visual-in-context-learning-2023/</loc>
    <lastmod>2023-02-06T22:38:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jing_yu_koh-grounding-language-models-to-images-for-multimodal-generation-2023/</loc>
    <lastmod>2023-02-06T22:37:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/visual-question-answering/</loc>
    <lastmod>2023-02-06T22:36:41+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/zhenfang_chen-see-think-confirm-interactive-prompting-between-vision-and-language-models-for-knowledge-based-visual-reasoning-2023/</loc>
    <lastmod>2023-02-06T22:36:41+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xiaotian_liu-a-planning-based-neural-symbolic-approach-for-embodied-instruction-following-2022/</loc>
    <lastmod>2023-02-02T13:28:19+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/so_yeon_min-film-following-instructions-in-language-with-modular-methods-2022/</loc>
    <lastmod>2023-02-01T18:32:24+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yuki_inoue-prompter-utilizing-large-language-model-prompting-for-a-data-efficient-embodied-instruction-following-2022/</loc>
    <lastmod>2023-02-01T17:22:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/kyle_mahowald-dissociating-language-and-thought-in-large-language-models-a-cognitive-perspective-2023/</loc>
    <lastmod>2023-01-31T18:47:45+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/michael_janner-planning-with-diffusion-for-flexible-behaviour-synthesis-2022/</loc>
    <lastmod>2023-01-30T13:43:20+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/shailaja_keyur_sampat-reasoning-about-actions-over-visual-and-linguistic-modalities-a-survey-2022/</loc>
    <lastmod>2023-01-20T13:59:00+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xin_wang-reinforced-cross-modal-matching-and-self-supervised-imitation-learning-for-vision-language-navigation-2019/</loc>
    <lastmod>2023-01-18T09:48:14+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alekh_agarwal-pcpg-policy-cover-directed-exploration-for-provable-policy-gradient-learning-2020/</loc>
    <lastmod>2022-12-28T14:39:25+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/policy-gradient/</loc>
    <lastmod>2022-12-28T14:39:25+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alekh_agarwal-on-the-theory-of-policy-gradient-methods-optimality-approximation-and-distribution-shift-2020/</loc>
    <lastmod>2022-12-28T14:36:20+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/chloe_ching_yun_hsu-revisiting-design-choices-in-proximal-policy-optimisation-2020/</loc>
    <lastmod>2022-12-28T14:32:15+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/james_queeney-generalized-proximal-policy-optimisation-with-sample-reuse-2021/</loc>
    <lastmod>2022-12-28T14:00:32+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/lun_wang-backdoorl-backdoor-attack-against-competitive-reinforcement-learning-2021/</loc>
    <lastmod>2022-12-28T03:57:59+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/sandy_huang-adversarial-attacks-on-neural-network-policies-2017/</loc>
    <lastmod>2022-12-28T00:08:22+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yinglun_xu-efficient-reward-poisoning-attacks-on-online-deep-reinforcement-learning-2022/</loc>
    <lastmod>2022-12-27T23:14:19+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/reward-poisoning/</loc>
    <lastmod>2022-12-27T22:50:14+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/young_wu-reward-poisoning-attacks-on-offline-multi-agent-reinforcement-learning-2022/</loc>
    <lastmod>2022-12-27T22:50:14+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/attack-poisoning/</loc>
    <lastmod>2022-12-27T20:35:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/robust-reinforcement-learning/</loc>
    <lastmod>2022-12-27T20:35:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xuezhou_zhang-robust-policy-gradient-against-strong-data-corruption-2021/</loc>
    <lastmod>2022-12-27T20:35:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/kiarash_banihashem-defense-against-reward-poisoning-attacks-in-reinforcement-learning-2021/</loc>
    <lastmod>2022-12-27T18:27:17+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/amin_rakhsha-reward-poisoning-in-reinforcement-learning-attacks-against-unknown-learners-in-unknown-environments-2021/</loc>
    <lastmod>2022-12-27T15:50:22+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xuezhou_zhang-adaptive-reward-poisoning-attacks-against-reinforcement-learning-2020/</loc>
    <lastmod>2022-12-27T00:21:15+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/anindya_sarkar-reward-delay-attacks-on-deep-reinforcement-learning-2022/</loc>
    <lastmod>2022-12-26T21:07:03+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/blog-review/</loc>
    <lastmod>2022-12-26T19:50:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/proximal-policy-optimisation-explained-blog/</loc>
    <lastmod>2022-12-26T19:50:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/perturbed-rewards/</loc>
    <lastmod>2022-12-26T01:11:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tom_everitt-reinforcement-learning-with-a-corrupted-reward-channel-2017/</loc>
    <lastmod>2022-12-26T01:11:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yunhan_huang-manipulating-reinforcement-learning-stealthy-attacks-on-cost-signals-2020/</loc>
    <lastmod>2022-12-25T19:12:17+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/vincent_zhuang-no-regret-reinforcement-learning-with-heavy-tailed-rewards-2021/</loc>
    <lastmod>2022-12-25T18:15:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/wenshuai_zhao-towards-closing-the-sim-to-real-gap-in-collaborative-multi-robot-deep-reinforcement-learning-2020/</loc>
    <lastmod>2022-12-25T16:54:11+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jan_corazza-reinforcement-learning-with-stochastic-reward-machines-2022/</loc>
    <lastmod>2022-12-24T22:36:07+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/non-markovian-rewards/</loc>
    <lastmod>2022-12-24T22:36:07+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/oguzhan_dogru-reinforcement-learning-with-constrained-uncertain-reward-function-through-particle-filtering-2022/</loc>
    <lastmod>2022-12-24T19:32:25+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/inaam_ilahi-challenges-and-countermeasures-for-adversarial-attacks-on-reinforcement-learning-2022/</loc>
    <lastmod>2022-12-24T17:06:12+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/zuxin_liu-on-the-robustness-of-safe-reinforcement-learning-under-observational-perturbations-2022/</loc>
    <lastmod>2022-12-22T22:38:13+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ruben_majadas-disturbing-reinforcement-learning-agents-with-corrupted-rewards-2021/</loc>
    <lastmod>2022-12-17T00:38:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jingkang_wang-reinforcement-learning-with-perturbed-rewards-2020/</loc>
    <lastmod>2022-12-16T20:48:51+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jacob_andreas-language-models-as-agent-models-2022/</loc>
    <lastmod>2022-12-10T00:47:33+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/natural-language-processing/</loc>
    <lastmod>2022-12-10T00:47:33+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/charlie_snell-context-aware-language-modeling-for-goal-oriented-dialogue-systems-2022/</loc>
    <lastmod>2022-11-20T16:29:59+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/sanchit_agarwal-building-goal-oriented-dialogue-systems-with-situated-visual-context-2021/</loc>
    <lastmod>2022-11-20T16:29:14+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/instruction-following/</loc>
    <lastmod>2022-11-20T16:28:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/symbolic-planning/</loc>
    <lastmod>2022-11-20T16:28:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yichi_zhang-danli-deliberative-agent-for-following-natural-language-instructions-2022/</loc>
    <lastmod>2022-11-20T16:28:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xiang_li-diffusion_lm_improves_controllable_text_generation_2022/</loc>
    <lastmod>2022-11-14T16:32:31+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/paper_proposal_nov_2022/</loc>
    <lastmod>2022-11-13T15:59:12+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/november-2022-weekly-progress/</loc>
    <lastmod>2022-11-13T15:59:12+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jie_huang-can-language-models-be-specific-how-2022/</loc>
    <lastmod>2022-11-08T20:41:04+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yizhou_zhao-semantic-aligned-fusion-transformer-for-one-shot-object-detection-2022/</loc>
    <lastmod>2022-10-24T19:14:34+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ting_i_hsieh-one-shot-object-detection-with-co-attention-and-co-excitation-2019/</loc>
    <lastmod>2022-10-24T19:13:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ayan_kumar_bhunia-a-deep-one-shot-network-for-query-based-logo-retrieval-2019/</loc>
    <lastmod>2022-10-24T19:12:22+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/action-detection/</loc>
    <lastmod>2022-10-20T19:06:41+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yuetian_weng-an-efficient-spatio-temporal-pyramid-transformer-for-action-detection-2022/</loc>
    <lastmod>2022-10-20T19:06:41+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/steven_kapturowski-human-level-atari-200x-faster-2022/</loc>
    <lastmod>2022-10-05T23:22:01+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/andrea_banino-coberl-contrastive-bert-for-reinforcement-learning-2022/</loc>
    <lastmod>2022-10-05T23:04:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/transformer/</loc>
    <lastmod>2022-10-05T23:04:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alex_petrekno-sample-factory-asynchronous-rl-at-very-high-fps-2020/</loc>
    <lastmod>2022-09-25T16:34:09+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jonathan_ho-video-diffusion-models-2022/</loc>
    <lastmod>2022-09-22T20:40:21+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/dongwon-fire-burns-sword-cuts-commonsense-inductive-bias-for-exploration-in-text-based-games-2022/</loc>
    <lastmod>2022-09-22T19:38:56+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/wenlong_huang-language-models-as-zero-shot-planners-extracting-actionable-knowledge-for-embodied-agents-2022/</loc>
    <lastmod>2022-09-19T21:55:13+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/pengchuan_zhang-vinvl-revisiting-visual-representations-in-vision-language-models-2021/</loc>
    <lastmod>2022-09-03T17:17:47+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/xiujun_li-oscar-object-semantic-aligned-pro-training-for-vision-language-tasks-2020/</loc>
    <lastmod>2022-09-03T17:12:54+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/sentence-embeddings/</loc>
    <lastmod>2022-08-27T16:03:42+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yung_sung_chuang-diffcse-difference-based-contrastive-learning-for-sentence-embeddings-2022/</loc>
    <lastmod>2022-08-27T16:03:42+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/gregor_geigle-retrieve-fast-rerank-smart-coorperative-and-joint-approaches-for-improved-cross-modal-retrieval-2022/</loc>
    <lastmod>2022-08-27T00:31:38+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/kaitao_song-mpnet-masked-and-permuted-retrain-for-language-understanding-2020/</loc>
    <lastmod>2022-08-25T12:24:55+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/sergios_karagiannakos-vision-language-models-towards-multimodal-dl-2022/</loc>
    <lastmod>2022-08-09T07:37:30+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jiali_duan-multimodal-alignment-using-representation-codebook-2022/</loc>
    <lastmod>2022-08-09T07:26:46+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/instruction-following-as-a-path-to-general-problem-solving-agent-aug-2022/</loc>
    <lastmod>2022-08-07T17:17:07+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/phd-thesis-plan/</loc>
    <lastmod>2022-08-07T17:17:07+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/supplementary-notes-for-mindmap-aug-2022/</loc>
    <lastmod>2022-08-04T12:59:17+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/younggyo_seo-masked-world-models-for-visual-control-2022/</loc>
    <lastmod>2022-07-01T12:03:57+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/a-brief-overview-of-rank-based-prioritized-experience-replay-2022/</loc>
    <lastmod>2022-06-02T11:47:17+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/biography/</loc>
    <lastmod>2022-05-31T20:37:09+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/deepmind-flamingo-a-visual-language-model-for-few-shot-learning-2022/</loc>
    <lastmod>2022-05-11T16:35:03+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/angela_fan-augmenting-transformer-with-knn-composite-memory-for-dialog-2021/</loc>
    <lastmod>2022-04-21T11:01:14+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/dialogue-system/</loc>
    <lastmod>2022-04-21T11:01:14+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/future-work/</loc>
    <lastmod>2022-04-21T11:01:14+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/hao_hu-generalisable-episodic-memory-for-drl-2021/</loc>
    <lastmod>2022-04-07T12:12:20+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/memory/</loc>
    <lastmod>2022-04-07T12:12:20+10:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/ilya_kostrikov-offline-rl-with-implicit-q-learning-2021/</loc>
    <lastmod>2022-03-22T19:01:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/offline-rl/</loc>
    <lastmod>2022-03-22T19:01:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/qinqing_zheng-online-decision-transformer-2022/</loc>
    <lastmod>2022-03-21T21:56:45+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/sebastian_borgeaud-improving-language-models-by-retrieving-from-trillions-of-tokens-2022/</loc>
    <lastmod>2022-03-21T19:07:36+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/machel_reid-can-wikipedia-help-offline-rl-2022/</loc>
    <lastmod>2022-03-16T21:18:24+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/domain-modelling/</loc>
    <lastmod>2022-03-15T16:34:45+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/stephen_cresswell-generalised-domain-model-acquisition-from-action-traces-2013/</loc>
    <lastmod>2022-03-15T16:34:45+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/wenfeng_feng-extracting-action-sequences-from-texts-by-rl/</loc>
    <lastmod>2022-03-15T14:40:38+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/shivam_miglani-nltopddl-learning-from-nlp-manuals-2020/</loc>
    <lastmod>2022-03-14T15:08:45+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/giuseppe_de_giacomo-foundations-for-retraining-bolts-rl-with-ltl-2019/</loc>
    <lastmod>2022-03-04T12:12:57+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/linear-temporal-logic/</loc>
    <lastmod>2022-03-04T12:12:57+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/atari-2600/</loc>
    <lastmod>2022-03-04T12:12:27+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/joseph_kim-collaborative-planning-with-encoding-of-high-level-strategies-2017/</loc>
    <lastmod>2022-03-04T12:12:27+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/mikayel_samvelyan-minihack-the-planet-a-sandbox-for-open-ended-rl-research-2021/</loc>
    <lastmod>2022-03-04T12:11:55+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/nethack/</loc>
    <lastmod>2022-03-04T12:11:55+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/richard_shin-constrained-language-models-yield-few-shot-semantic-parsers-2021/</loc>
    <lastmod>2022-03-02T00:19:18+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/heinrich_kuttler-the-nethack-learning-environment-2020/</loc>
    <lastmod>2022-03-02T00:18:35+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/pashootan_vaezipoor-ltl2action-generalising-ltl-instructions-for-multi-task-rl-2021/</loc>
    <lastmod>2022-03-01T20:53:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/roma_patel-learning-to-ground-language-temporal-logical-form-2019/</loc>
    <lastmod>2022-02-28T21:40:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/glue/</loc>
    <lastmod>2022-02-28T18:58:52+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/thang_m_pham-out-of-order-how-important-is-the-sequential-order-of-words-in-a-sentence-in-natural-language-understanding-tasks-2021/</loc>
    <lastmod>2022-02-28T18:58:52+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/anton_belyy-guided-k-best-selection-for-semantic-parsing-annotation-2021/</loc>
    <lastmod>2022-02-23T19:42:39+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/semantic-parsing/</loc>
    <lastmod>2022-02-23T19:42:39+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/argumentative-zoning/</loc>
    <lastmod>2022-02-16T14:40:57+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/information-retrieval/</loc>
    <lastmod>2022-02-16T14:40:57+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/s_teufel-argumentative-zoning-2000/</loc>
    <lastmod>2022-02-16T14:40:57+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/categories/thesis-review/</loc>
    <lastmod>2022-02-16T14:40:57+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/compositionality/</loc>
    <lastmod>2022-02-08T14:20:19+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jacob_andreas-compositionality-as-lexical-symmetry-2022/</loc>
    <lastmod>2022-02-08T14:20:19+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/rnn/</loc>
    <lastmod>2022-01-14T00:26:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tao_lei-when-attention-meets-fast-recurrence-training-language-models-with-reduced-compute-2021/</loc>
    <lastmod>2022-01-14T00:26:37+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/alex_nichol-glide-towards-photorealistic-image-generation-and-editing-with-text-guided-diffusion-models-2021/</loc>
    <lastmod>2022-01-12T16:54:01+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/gan/</loc>
    <lastmod>2022-01-12T16:54:01+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/junyang_lin-m6-a-chinese-multimodal-pretrainer-2021/</loc>
    <lastmod>2022-01-12T13:38:14+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/grounded-language-learning/</loc>
    <lastmod>2022-01-03T22:38:40+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tianshi_cao-babyai-plus-plus-towards-grounded-language-learning-beyond-memorization-2020/</loc>
    <lastmod>2022-01-03T22:38:40+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/federico_bianchi-language-in-a-search-box-grounding-language-learning-in-real-world-human-machine-interaction-2021/</loc>
    <lastmod>2022-01-03T16:51:39+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/imitation-learning/</loc>
    <lastmod>2021-12-24T23:29:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/lili_chen-decision-transformer-reinforcement-learning-via-sequence-modeling-2021/</loc>
    <lastmod>2021-12-24T23:29:49+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jiayuan_mao-grammar-based-grounded-lexicon-learning-2021/</loc>
    <lastmod>2021-12-22T17:22:15+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/iglu/</loc>
    <lastmod>2021-12-22T15:10:56+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/julia_kiseleva-interactive-grounded-language-understanding-in-a-collaborative-environment-2021/</loc>
    <lastmod>2021-12-22T15:10:56+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/dominik_drexler-expressing-and-exploiting-the-common-subgoal-structure-of-classical-planning-domains-using-sketches-2021/</loc>
    <lastmod>2021-12-17T13:07:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/policy-sketches/</loc>
    <lastmod>2021-12-17T13:07:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/width-based-planning/</loc>
    <lastmod>2021-12-17T13:07:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/yiding_jiang-language-as-abstraction-for-hierarchical-deep-reinforcement-learning/</loc>
    <lastmod>2021-12-15T19:49:28+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/hengyuan_hu-hierarchical-decision-making-by-generating-and-following-natural-language-instructions-2019/</loc>
    <lastmod>2021-12-15T13:11:05+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/attention-mechanism/</loc>
    <lastmod>2021-12-15T12:59:07+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/causal-reasoning/</loc>
    <lastmod>2021-12-15T12:59:07+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/david_ding-attention-over-learned-object-embeddings-enables-complex-visual-reasoning-2021/</loc>
    <lastmod>2021-12-15T12:59:07+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/object-detection/</loc>
    <lastmod>2021-12-15T12:59:07+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/jacob_andreas-modular-multitask-reinforcement-learning-with-policy-sketches-2017/</loc>
    <lastmod>2021-12-13T17:23:12+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/david_abel-on-the-expressivity-of-markov-reward-2021/</loc>
    <lastmod>2021-12-05T12:02:23+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/evaluation/</loc>
    <lastmod>2021-12-03T19:50:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/rishabh_agarwal-deep-reinforcement-learning-at-the-edge-of-the-stats-precipice-2021/</loc>
    <lastmod>2021-12-03T19:50:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/borja_ibarz-reward-learning-from-human-preferences-and-demonstrations-in-atari-2018/</loc>
    <lastmod>2021-11-27T19:14:04+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/adrien_ecoffet-go-explore-a-new-approach-for-hard-exploration-problems-2021-paper-review/</loc>
    <lastmod>2021-11-27T18:58:32+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/tuomas_haarnoja-soft-actor-critic-off-policy-maximum-entropy-deep-reinforcement-learning-with-a-stochastic-actor-2018-paper-review/</loc>
    <lastmod>2021-11-18T12:08:53+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/adria-badia-agent57-outperforming-the-atari-human-benchmark-2020-paper-review/</loc>
    <lastmod>2021-11-18T12:05:47+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/stefan-o-toole-width-based-lookaheads-with-learnt-base-policies-and-heuristics-over-the-atari-2600-benchmark-2021-paper-reivew/</loc>
    <lastmod>2021-11-16T17:40:10+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/posts/cristian-paul-bara-mindcraft-theory-of-mind-modelling-2021-paper-review/</loc>
    <lastmod>2021-11-12T12:56:24+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/tags/dataset/</loc>
    <lastmod>2021-11-12T12:56:24+11:00</lastmod>
  </url><url>
    <loc>https://sino-huang.github.io/archives/</loc>
  </url><url>
    <loc>https://sino-huang.github.io/biography/detailed-background/</loc>
  </url><url>
    <loc>https://sino-huang.github.io/biography/publications/</loc>
  </url><url>
    <loc>https://sino-huang.github.io/news/</loc>
  </url><url>
    <loc>https://sino-huang.github.io/search/</loc>
  </url><url>
    <loc>https://sino-huang.github.io/series/</loc>
  </url>
</urlset>
