* Create a readme for docs, add script to convert to webp
* Create webp versions of the files
* Update conversion script and readme
* Add webnav figures
* Add lazy loading and alts for images
* Update theme-changing button to have a name
* Make webnav.demo smaller
* Embed fonts
<img loading="lazy" alt="Example of ai tasks" src="{{ '/assets/images/examples/ai.1.oyuiubm.webp' | relative_url }}" width="24%" height="auto">
<img loading="lazy" alt="Example of booking tasks" src="{{ '/assets/images/examples/booking.1.pxtuocd.webp' | relative_url }}" width="24%" height="auto">
<img loading="lazy" alt="Example of composing tasks" src="{{ '/assets/images/examples/composing.1.tbtnzql.webp' | relative_url }}" width="24%" height="auto">
<img loading="lazy" alt="Example of lookup tasks" src="{{ '/assets/images/examples/lookup.1.zbrxcee.webp' | relative_url }}" width="24%" height="auto">
<img loading="lazy" alt="Example of productivity tasks" src="{{ '/assets/images/examples/productivity.1.ytcgitj.webp' | relative_url }}" width="24%" height="auto">
<img loading="lazy" alt="Example of shopping tasks" src="{{ '/assets/images/examples/shopping.1.wbamufj.webp' | relative_url }}" width="24%" height="auto">
<img loading="lazy" alt="Example of social tasks" src="{{ '/assets/images/examples/social.1.xmrqcyz.webp' | relative_url }}" width="24%" height="auto">
<img loading="lazy" alt="Example of summarizing tasks" src="{{ '/assets/images/examples/summarizing.1.bctdmtt.webp' | relative_url }}" width="24%" height="auto">
## What is *conversational web navigation*?

We propose the problem of *conversational web navigation*, where a digital agent controls a web browser and follows user instructions to solve real-world tasks in a multi-turn dialogue fashion. To accomplish this, agents can learn from expert demonstrations, as shown below:
<!-- Here, there should be a 3-column layout with the following content:
2. The action and conversation history (preferably with nice text formatting)
3. The screenshot -->
## Can we download WebLINX now?

__[You can find our dataset on Huggingface Datasets](https://huggingface.co/datasets/McGill-NLP/weblinx)__
## What if I want to download the raw data (HTML, screenshots, etc.)?

If you are interested in the full data, the easiest way to download the raw dataset is to use the `huggingface_hub` library with `snapshot_download`. We show you how in the [docs' prerequisites section]({{'/docs/#prerequisites' | relative_url }}).
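As a minimal sketch of that approach: `snapshot_download` is the real `huggingface_hub` function and the repository id matches the dataset link above, but the helper name and `local_dir` default below are illustrative assumptions, not part of the project's code.

```python
# Sketch: download the raw WebLINX dataset with huggingface_hub.
# The helper name and local_dir default are illustrative assumptions.
def download_weblinx_raw(local_dir: str = "./wl_data") -> str:
    # Lazy import so the helper can be defined without the package installed.
    from huggingface_hub import snapshot_download

    # repo_type="dataset" targets the dataset repo rather than a model repo.
    return snapshot_download(
        repo_id="McGill-NLP/weblinx",
        repo_type="dataset",
        local_dir=local_dir,
    )

# Usage (downloads many gigabytes; run deliberately):
# path = download_weblinx_raw()
```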
You can install the library with `pip install weblinx`.
Please take a look at the [library documentation]({{'/docs/' | relative_url }}) for more information on how to use it.
## How can we use WebLINX to train agents?

Our agent is composed of two main components: a __Dense Markup Ranker (DMR)__ and an __action model__.
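Conceptually, the two components compose as a rank-then-generate pipeline: the DMR scores candidate DOM elements against the dialogue context, and the action model only sees the top-ranked candidates. The sketch below is ours, not the project's code; `rank` and `generate` are stand-ins for the two models.

```python
# Conceptual two-stage agent step (illustrative, not the project's code):
# rank(element, context) -> relevance score   (plays the role of DMR)
# generate(context, candidates) -> action str (plays the role of the action model)
def agent_step(elements, context, rank, generate, k=10):
    # Stage 1: rank all candidate markup elements against the dialogue context.
    scored = sorted(elements, key=lambda el: rank(el, context), reverse=True)
    # Stage 2: the action model conditions only on the top-k elements.
    return generate(context, scored[:k])
```

The point of the split is that the action model never has to read the full page: the ranker prunes the markup first.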
<!-- There should be a card of 5 models here (MindAct, Pix2Act, Fuyu-8B, LLaMA-13B, GPT-4V) with links to the original papers of those models. -->
## Where can we find the finetuned models?

We provide the weights for the models we finetuned. You can [access them on Huggingface Hub](https://huggingface.co/collections/McGill-NLP/weblinx-models-65c57d4afeeb282d1dcf8434). We will share [code to reproduce our experiments on our GitHub repository](https://github.com/mcgill-nlp/weblinx). Please note that they were finetuned for research purposes, so they are not production-ready.
## How do we use the agent to control browsers?

Our `weblinx` library lets you convert HTML into a format that can be consumed by DMR or by an action model; it can also parse valid model outputs into a dictionary that can be converted into browser commands.
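To illustrate the parsing step only: the toy parser below turns a model output string into a command dictionary. It is not `weblinx`'s parser, and the `click(uid="…")`-style action format it assumes is an illustration, not the library's exact specification.

```python
import re

# Toy parser (illustrative only; weblinx ships its own parsing utilities).
# Assumed action format: intent(key="value", key="value", ...)
def parse_action(output: str) -> dict:
    match = re.fullmatch(r'(\w+)\((.*)\)', output.strip())
    if match is None:
        raise ValueError(f"Unparseable action: {output!r}")
    intent, arg_str = match.groups()
    # Collect the comma-separated key="value" arguments into a dict.
    args = dict(re.findall(r'(\w+)="([^"]*)"', arg_str))
    return {"intent": intent, "args": args}

# parse_action('click(uid="abc123")')
# -> {"intent": "click", "args": {"uid": "abc123"}}
```

A dictionary like this is what gets translated into an actual browser command in the next step.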
You will need Selenium or Puppeteer to control the browser (take screenshots, grab HTML, insert unique IDs, execute actions from the dictionary); you can [learn Selenium here](https://www.selenium.dev/documentation/webdriver/getting_started/).
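A sketch of that browser side with Selenium, under stated assumptions: the action-dictionary format and both helper names are ours, and `run_step` requires a local chromedriver; only `page_source`, `save_screenshot`, `find_element`, and `click` are real Selenium APIs.

```python
def locator_for(action: dict) -> tuple:
    # Map an action dictionary (format is an illustrative assumption)
    # to a (strategy, value) pair accepted by Selenium's find_element.
    if action["intent"] == "click":
        return ("css selector", action["args"]["css"])
    raise ValueError(f"Unsupported intent: {action['intent']}")

def run_step(url: str, action: dict) -> None:
    # One browser step; needs selenium installed and a local chromedriver.
    from selenium import webdriver  # lazy import: only needed when run

    driver = webdriver.Chrome()
    try:
        driver.get(url)
        html = driver.page_source           # grab HTML for the ranker
        driver.save_screenshot("page.png")  # screenshot for vision models
        by, value = locator_for(action)
        driver.find_element(by, value).click()  # execute the action
    finally:
        driver.quit()

# Usage (opens a real browser window):
# run_step("https://example.com", {"intent": "click", "args": {"css": "a"}})
```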
## How do we cite WebLINX?

If you use our dataset, code, or models, please cite WebLINX with the following BibTeX entry: