From 9e9268d6b8400f30e6deb9dada726ae437e6f8c2 Mon Sep 17 00:00:00 2001 From: Sergio Hernandez Date: Wed, 4 Sep 2024 20:02:33 +0100 Subject: [PATCH] feat: new content (master's thesis update) --- components/research/table.vue | 18 +++++++++--------- content/research/publications.json | 28 +++++++++++++++++++++++++--- pages/index.vue | 10 +++++----- pages/research.vue | 7 ++++--- 4 files changed, 43 insertions(+), 20 deletions(-) diff --git a/components/research/table.vue b/components/research/table.vue index ccc7980..64a2349 100644 --- a/components/research/table.vue +++ b/components/research/table.vue @@ -84,6 +84,11 @@ function onRowClick(event: any) { + + + - + - + - - - - + diff --git a/content/research/publications.json b/content/research/publications.json index 0852cc4..201cc4e 100644 --- a/content/research/publications.json +++ b/content/research/publications.json @@ -1,12 +1,31 @@ [ + { + "title": "Solving Reasoning Problems with Large Language Models via Recursive Decomposition", + "authors": ["Sergio Hernández-Gutiérrez", "Pekka Marttinen", "Alexander Nikitin", "Minttu Alakuijala"], + "venue": "Aalto University", + "year": "2024", + "status": "published", + "type": "thesis", + "abstract": "This thesis studies the recursive decomposition of reasoning problems with large language models. We propose two methods implementing this technique: one enforcing sub-problem independence during the decomposition of problems and the other enabling the modeling of dependencies between sub-problems. We evaluate these methods on two benchmarks with six difficulty levels each and on two in-context settings with contrasting degrees of task-specific data availability. We find that our methods employing recursive decomposition outperform state-of-the-art baselines as the complexity of the tasks increases while being more time and space-efficient. 
We additionally provide an analysis of the errors the methods made during our experiments; they can also recover from mistakes made during the problem-solving process. The formulation of our methodology enables its integration into generic intelligent systems, the safe parallelization of a great part of its execution, as well as its composition with other state-of-the-art frameworks. We open-source our implementation of these methods, along with a wider set of tools to augment the software landscape for reasoning research with large language models.", "recognitions": "", "links": [ { "title": "PDF", "url": "https://drive.google.com/file/d/1-7M4VIyXvbIWQL9-pllrtX1UrDSnccgM/view?usp=share_link", "icon": "tabler:file-type-pdf" } ] }, { "title": "Following Ancestral Footsteps: Co-Designing Morphology and Behaviour with Self-Imitation Learning", "authors": ["Sergio Hernández-Gutiérrez", "Ville Kyrki", "Kevin S. Luck"], - "venue": "CoRL", + "venue": "EARL (RSS), oral presentation", "year": "2024", - "status": "submitted", - "type": "journal", + "status": "published", + "type": "workshop", "abstract": "In this paper we consider the problem of co-adapting the body and behaviour of agents, a long-standing research problem in the community of evolutionary robotics. Previous work has largely focused on the development of methods exploiting massive parallelization of agent evaluations with large population sizes, a paradigm which is not applicable to the real world. More recent data-efficient approaches utilizing reinforcement learning can suffer from distributional shifts in transition dynamics as well as in state and action spaces when experiencing new body morphologies. In this work, we propose a new co-adaptation method combining reinforcement learning and State-Aligned Self-Imitation Learning. 
We show that the integration of a self-imitation signal improves the data-efficiency of the co-adaptation process as well as the behavioural recovery when adapting morphological parameters.", + "recognitions": "Best Workshop Paper Award", "links": [ { "title": "PDF", @@ -29,6 +48,7 @@ "status": "unpublished", "type": "seminar", "abstract": "Hierarchical reinforcement learning (HRL) methods have recently enabled higher sample efficiency in high-dimensional and long reinforcement learning (RL) problems. Goal-conditioned HRL (GCHRL) approaches concretize these hierarchical ideas by providing reachable sub-goals and considering a chain of policies that model the actions required to reach them, which are either less abstract sub-goals or the agent's native actions. This paper analyses and compares the current state-of-the-art GCHRL methods. Additionally, it discusses the current and future key challenges of the area, including efficient state space exploration, meaningful sub-goal generation and representation, the non-stationarity of policies and the transfer of skills learnt for one problem to solve another. Finally, it contributes to the current discussion on future directions and key focus points within the field of GCHRL.", + "recognitions": "", "links": [ { "title": "PDF", @@ -46,6 +66,7 @@ "status": "published", "type": "thesis", "abstract": "During my Bachelor's thesis at UCL, supervised by Prof. Robin Hirsch, I carried out a study on the validity rates of modal logic formulae as their complexity increases (i.e., more allowed connectives and larger formulae). For this purpose, I implemented a frame-based analytical tableau theorem prover for propositional modal logics K, KT, KB, K4, KD and linear modal logic. 
This implementation was compared to Molle, a state-of-the-art theorem prover for modal logics at the time; this analysis found inconsistencies in the results of both provers, concluding with evidence of Molle's incorrectness on complex formulae.", + "recognitions": "", "links": [ { "title": "PDF", @@ -63,6 +84,7 @@ "status": "published", "type": "article", "abstract": "In this article in partnership with Microsoft, as a Microsoft Student Partner, I give an introduction to 3D reconstruction of physical objects. In particular, I explain the process of reconstructing fire-damaged parchments and, as part of my 2nd year project at UCL, building a product for archivists and other professionals who are in need of a parchment-reconstruction tool to read them.", + "recognitions": "", "links": [ { "title": "Microsoft Faculty Connection", diff --git a/pages/index.vue b/pages/index.vue index 3ca2029..0337b19 100644 --- a/pages/index.vue +++ b/pages/index.vue @@ -37,8 +37,9 @@ definePageMeta({

I am a Machine Learning Scientist currently looking for - PhD opportunities. My current research interests revolve around employing deep models to solve - complex reasoning or decision-making tasks, how knowledge and data + PhD opportunities. My current research interests revolve around employing deep + models to solve + complex reasoning and decision-making tasks, how knowledge and data representation affects such capabilities, as well as learning the reinforcement learning process (meta-learning) outside of @@ -62,10 +63,9 @@ definePageMeta({

diff --git a/pages/research.vue b/pages/research.vue index 73a72ff..6923c4c 100644 --- a/pages/research.vue +++ b/pages/research.vue @@ -20,10 +20,11 @@ function togglePopup(publication: any) { Current interests
-

I am currently working on my Master's thesis, exploring how large foundation +

I recently submitted my Master's thesis, exploring how language models can be used to - solve multi-step reasoning problems via task decomposition. + solve multi-step reasoning problems via task decomposition as the complexity of + the tasks increases. My interests at the moment include:

  • Knowledge representation in deep models (e.g., latent embedding spaces), @@ -32,7 +33,7 @@ function togglePopup(publication: any) { languages.
  • Deep architectures and methods for solving complex reasoning problems - (e.g., mathematics or logic). + (e.g., mathematics, programming tasks, planning, etc.).
  • Reinforcement and imitation learning, particularly meta-learning the RL/IL process outside of classical algorithmic approaches.