From de92e626ae768ba667e43272a18a9f5659f44697 Mon Sep 17 00:00:00 2001 From: gfw-report Date: Sat, 20 Jul 2024 00:00:00 +0000 Subject: [PATCH 1/7] Fix a typo in Padmanabhan2021a. --- references.bib | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/references.bib b/references.bib index 94e7e3e..36f25ea 100644 --- a/references.bib +++ b/references.bib @@ -604,7 +604,7 @@ @inproceedings{Basso2021a } @inproceedings{Padmanabhan2021a, - author = {Ramakrishna Padmanabhan and and Arturo Filastò and Maria Xynou and Ram Sundara Raman and Kennedy Middleton and Mingwei Zhang and Doug Madory and Molly Roberts and Alberto Dainotti}, + author = {Ramakrishna Padmanabhan and Arturo Filastò and Maria Xynou and Ram Sundara Raman and Kennedy Middleton and Mingwei Zhang and Doug Madory and Molly Roberts and Alberto Dainotti}, title = {A multi-perspective view of {Internet} censorship in {Myanmar}}, booktitle = {Free and Open Communications on the Internet}, publisher = {ACM}, From 6c62000c8e0966c5615314cbe2f000515d96721c Mon Sep 17 00:00:00 2001 From: gfw-report Date: Sat, 20 Jul 2024 00:00:00 +0000 Subject: [PATCH 2/7] Add ten FOCI'24 issue 2 papers. * PETS publication page: https://www.petsymposium.org/foci/2024/ * FOCI program: https://foci.community/foci24.html#2024-summer-program * Net4People post: https://github.com/net4people/bbs/issues/376 I do not include the three papers in Session III: Privacy Enhancing Technologies, as they are out of scope of Internet censorship. 
--- references.bib | 90 ++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 90 insertions(+) diff --git a/references.bib b/references.bib index 36f25ea..323ec58 100644 --- a/references.bib +++ b/references.bib @@ -7,6 +7,96 @@ @inproceedings{Kon2024b url = {https://www.cs-pk.com/sec24-spotproxy-final.pdf}, } +@inproceedings{Ahmed2024a, + author = {Mohamed Ahmed and Jeffrey Knockel}, + title = {{Extended Abstract}: The Impact of Online Censorship on {LLMs}}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0006.pdf}, +} + +@inproceedings{Gao2024a, + author = {Tianyu Gao and Ping Ji}, + title = {{Extended Abstract}: Leveraging Large Language Models to Identify {Internet} Censorship through Network Data}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0007.pdf}, +} + +@inproceedings{Calle2024a, + author = {Paola Calle and Larissa Savitsky and Arjun Nitin Bhagoji and Nguyen Phong Hoang and Shinyoung Cho}, + title = {Toward Automated {DNS} Tampering Detection Using Machine Learning}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0008.pdf}, +} + +@inproceedings{Pu2024a, + author = {Michael Pu and Andrew Wang and Anthony Chang and Kieran Quan and Yi Wei Zhou}, + title = {Exploring {Amazon} Simple Queue Service ({SQS}) for Censorship Circumvention}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0009.pdf}, +} + +@inproceedings{Vilalonga2024a, + author = {Afonso Vilalonga and João S. 
Resende and Henrique Domingos}, + title = {Looking at the Clouds: Leveraging Pub/Sub Cloud Services for Censorship-Resistant Rendezvous Channels}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0010.pdf}, +} + +@inproceedings{Vines2024b, + author = {Paul Vines}, + title = {Ten Years Gone: Revisiting Cloud Storage Transports to Reduce Censored User Burdens}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0011.pdf}, +} + +@inproceedings{Müller2024a, + author = {Philipp Müller and Niklas Niere and Felix Lange and Juraj Somorovsky}, + title = {Turning Attacks into Advantages: Evading {HTTP} Censorship with {HTTP} Request Smuggling}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0012.pdf}, +} + +@inproceedings{Hanlon2024a, + author = {Michelina Hanlon and Gerry Wan and Anna Ascheman and Zakir Durumeric}, + title = {Detecting {VPN} Traffic through Encapsulated {TCP} Behavior}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0016.pdf}, +} + +@inproceedings{Kujath2024a, + author = {Beau Kujath and Jeffrey Knockel and Paul Aguilar and Diego Morabito and Masashi Crete-Nishihata and Jedidiah R. 
Crandall}, + title = {Analyzing Prominent Mobile Apps in {Latin America}}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0017.pdf}, +} + +@inproceedings{Ruo2024a, + author = {Samuel Ruo and Jeffrey Knockel and Zoë Reichert}, + title = {Lost in Translation: Characterizing Automated Censorship in Online Translation Services}, + booktitle = {Free and Open Communications on the {Internet}}, + publisher = {}, + year = {2024}, + url = {https://www.petsymposium.org/foci/2024/foci-2024-0018.pdf}, +} + @inproceedings{Wang2024a, author = {Chenxu Wang and Jiangyi Yin and Zhao Li and Hongbo Xu and Zhongyi Zhang and Qingyun Liu}, title = {Identifying {VPN} Servers through Graph-Represented Behaviors}, From 863792024d4ffe5ac50e314be3e7d373e3ab726f Mon Sep 17 00:00:00 2001 From: gfw-report Date: Sat, 20 Jul 2024 00:00:00 +0000 Subject: [PATCH 3/7] Do not brace {Internet} in booktitle. --- references.bib | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/references.bib b/references.bib index 323ec58..6f63e02 100644 --- a/references.bib +++ b/references.bib @@ -10,7 +10,7 @@ @inproceedings{Kon2024b @inproceedings{Ahmed2024a, author = {Mohamed Ahmed and Jeffrey Knockel}, title = {{Extended Abstract}: The Impact of Online Censorship on {LLMs}}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0006.pdf}, @@ -19,7 +19,7 @@ @inproceedings{Ahmed2024a @inproceedings{Gao2024a, author = {Tianyu Gao and Ping Ji}, title = {{Extended Abstract}: Leveraging Large Language Models to Identify {Internet} Censorship through Network Data}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = 
{https://www.petsymposium.org/foci/2024/foci-2024-0007.pdf}, @@ -28,7 +28,7 @@ @inproceedings{Gao2024a @inproceedings{Calle2024a, author = {Paola Calle and Larissa Savitsky and Arjun Nitin Bhagoji and Nguyen Phong Hoang and Shinyoung Cho}, title = {Toward Automated {DNS} Tampering Detection Using Machine Learning}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0008.pdf}, @@ -37,7 +37,7 @@ @inproceedings{Calle2024a @inproceedings{Pu2024a, author = {Michael Pu and Andrew Wang and Anthony Chang and Kieran Quan and Yi Wei Zhou}, title = {Exploring {Amazon} Simple Queue Service ({SQS}) for Censorship Circumvention}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0009.pdf}, @@ -46,7 +46,7 @@ @inproceedings{Pu2024a @inproceedings{Vilalonga2024a, author = {Afonso Vilalonga and João S. 
Resende and Henrique Domingos}, title = {Looking at the Clouds: Leveraging Pub/Sub Cloud Services for Censorship-Resistant Rendezvous Channels}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0010.pdf}, @@ -55,7 +55,7 @@ @inproceedings{Vilalonga2024a @inproceedings{Vines2024b, author = {Paul Vines}, title = {Ten Years Gone: Revisiting Cloud Storage Transports to Reduce Censored User Burdens}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0011.pdf}, @@ -64,7 +64,7 @@ @inproceedings{Vines2024b @inproceedings{Müller2024a, author = {Philipp Müller and Niklas Niere and Felix Lange and Juraj Somorovsky}, title = {Turning Attacks into Advantages: Evading {HTTP} Censorship with {HTTP} Request Smuggling}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0012.pdf}, @@ -73,7 +73,7 @@ @inproceedings{Müller2024a @inproceedings{Hanlon2024a, author = {Michelina Hanlon and Gerry Wan and Anna Ascheman and Zakir Durumeric}, title = {Detecting {VPN} Traffic through Encapsulated {TCP} Behavior}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0016.pdf}, @@ -82,7 +82,7 @@ @inproceedings{Hanlon2024a @inproceedings{Kujath2024a, author = {Beau Kujath and Jeffrey Knockel and Paul Aguilar and Diego Morabito and Masashi Crete-Nishihata and Jedidiah R. 
Crandall}, title = {Analyzing Prominent Mobile Apps in {Latin America}}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0017.pdf}, @@ -91,7 +91,7 @@ @inproceedings{Kujath2024a @inproceedings{Ruo2024a, author = {Samuel Ruo and Jeffrey Knockel and Zoë Reichert}, title = {Lost in Translation: Characterizing Automated Censorship in Online Translation Services}, - booktitle = {Free and Open Communications on the {Internet}}, + booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, url = {https://www.petsymposium.org/foci/2024/foci-2024-0018.pdf}, From 7a1e73c11d686a198482abd5e8745b454c655d84 Mon Sep 17 00:00:00 2001 From: gfw-report Date: Sat, 20 Jul 2024 00:00:00 +0000 Subject: [PATCH 4/7] Support accent characters in cite names. MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit A new commit introduces a cite name that contains an accented character: @inproceedings{Müller2024a, It will cause the bibtex parser to fail with the following two errors: failed to extract cite name of: @inproceedings{Müller2024a, and parse failed at 55:17: syntax error: unexpected $end, expecting tCOMM The second error is an upstream limitation; I will try to get a fix merged upstream: https://github.com/nickng/bibtex. --- src/main.go | 5 +++-- src/vendor/github.com/nickng/bibtex/token.go | 12 +++++++++++- 2 files changed, 14 insertions(+), 3 deletions(-) diff --git a/src/main.go b/src/main.go index d35de8c..08ffd86 100644 --- a/src/main.go +++ b/src/main.go @@ -13,8 +13,9 @@ import ( "github.com/nickng/bibtex" ) -// Matches e.g.: @inproceedings{Doe2024a, -var re = regexp.MustCompile(`@[a-z]*\{([A-Za-z\-]*[0-9]{4}[a-z]),`) +// Matches e.g.: @inproceedings{Müller2024a, +// \p{L}\p{M} matches any letter, including accented characters. 
+var re = regexp.MustCompile(`@[a-z]*\{([\"\p{L}\p{M}\-]*[0-9]{4}[a-z]),`) // Map a cite name (e.g., Doe2024a) to its line number in the .bib file. All // cite names are unique. diff --git a/src/vendor/github.com/nickng/bibtex/token.go b/src/vendor/github.com/nickng/bibtex/token.go index 17c451e..f26e32a 100644 --- a/src/vendor/github.com/nickng/bibtex/token.go +++ b/src/vendor/github.com/nickng/bibtex/token.go @@ -29,8 +29,18 @@ func isWhitespace(ch rune) bool { return ch == ' ' || ch == '\t' || ch == '\n' || ch == '\r' } +func isAccent(ch rune) bool { + accents := "äöüßéêçñÁÉÍÓÚáéíóúàèìòùâêîôûãõñÄÖÜ" + for _, accent := range accents { + if ch == accent { + return true + } + } + return false +} + func isAlpha(ch rune) bool { - return ('a' <= ch && ch <= 'z') || ('A' <= ch && ch <= 'Z') + return ('a' <= ch && ch <= 'z') || ('A' <= ch && ch <= 'Z') || isAccent(ch) } func isDigit(ch rune) bool { From 792f29e9ce903df6f36e90f20ab1d731990ff7e1 Mon Sep 17 00:00:00 2001 From: gfw-report Date: Sat, 20 Jul 2024 00:00:00 +0000 Subject: [PATCH 5/7] Upgrade nickng/bibtex to v1.4.0. 
This adds support for accented characters in bib keys: https://github.com/nickng/bibtex/releases/tag/v1.4.0 --- src/go.mod | 2 +- src/go.sum | 4 ++-- src/vendor/modules.txt | 2 +- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/src/go.mod b/src/go.mod index 3f4fb15..fa0c6be 100644 --- a/src/go.mod +++ b/src/go.mod @@ -2,4 +2,4 @@ module censorbib-go go 1.21.3 -require github.com/nickng/bibtex v1.3.0 +require github.com/nickng/bibtex v1.4.0 diff --git a/src/go.sum b/src/go.sum index 44be713..43d9823 100644 --- a/src/go.sum +++ b/src/go.sum @@ -1,2 +1,2 @@ -github.com/nickng/bibtex v1.3.0 h1:iv0408z8Xe+FEVquJUo8eraXnhrAF0e+2/WayPcism8= -github.com/nickng/bibtex v1.3.0/go.mod h1:4BJ3ka/ZjGVXcHOlkzlRonex6U17L3kW6ICEsygP2bg= +github.com/nickng/bibtex v1.4.0 h1:c5lcFG8RSXE0LrxAlkj9jHpYhzgLLKn2feyrUmiIz8A= +github.com/nickng/bibtex v1.4.0/go.mod h1:4BJ3ka/ZjGVXcHOlkzlRonex6U17L3kW6ICEsygP2bg= diff --git a/src/vendor/modules.txt b/src/vendor/modules.txt index f1b35c8..03268cc 100644 --- a/src/vendor/modules.txt +++ b/src/vendor/modules.txt @@ -1,3 +1,3 @@ -# github.com/nickng/bibtex v1.3.0 +# github.com/nickng/bibtex v1.4.0 ## explicit; go 1.18 github.com/nickng/bibtex From 044ab42cc6c6b5c35dd44e2aac1fa5e77f6d57c3 Mon Sep 17 00:00:00 2001 From: gfw-report Date: Sat, 20 Jul 2024 00:00:00 +0000 Subject: [PATCH 6/7] Remove {} for Extended Abstract in the title. 
--- references.bib | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/references.bib b/references.bib index 6f63e02..01ca95e 100644 --- a/references.bib +++ b/references.bib @@ -9,7 +9,7 @@ @inproceedings{Kon2024b @inproceedings{Ahmed2024a, author = {Mohamed Ahmed and Jeffrey Knockel}, - title = {{Extended Abstract}: The Impact of Online Censorship on {LLMs}}, + title = {Extended Abstract: The Impact of Online Censorship on {LLMs}}, booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, @@ -18,7 +18,7 @@ @inproceedings{Ahmed2024a @inproceedings{Gao2024a, author = {Tianyu Gao and Ping Ji}, - title = {{Extended Abstract}: Leveraging Large Language Models to Identify {Internet} Censorship through Network Data}, + title = {Extended Abstract: Leveraging Large Language Models to Identify {Internet} Censorship through Network Data}, booktitle = {Free and Open Communications on the Internet}, publisher = {}, year = {2024}, From eb1fdf5fa2f4041853d82be459c25c979e2169ab Mon Sep 17 00:00:00 2001 From: gfw-report Date: Sat, 20 Jul 2024 00:00:00 +0000 Subject: [PATCH 7/7] Add two PETS'24 papers. Selected from: https://github.com/net4people/bbs/issues/376. 
--- references.bib | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) diff --git a/references.bib b/references.bib index 01ca95e..3e41d45 100644 --- a/references.bib +++ b/references.bib @@ -7,6 +7,28 @@ @inproceedings{Kon2024b url = {https://www.cs-pk.com/sec24-spotproxy-final.pdf}, } +@article{Vines2024c, + author = {Paul Vines and Samuel McKay and Jesse Jenter and Suresh Krishnaswamy}, + title = {Communication Breakdown: Modularizing Application Tunneling for Signaling Around Censorship}, + journal = {Privacy Enhancing Technologies}, + volume = {2024}, + number = {1}, + publisher = {}, + year = {2024}, + url = {https://petsymposium.org/popets/2024/popets-2024-0027.pdf}, +} + +@article{Tang2024a, + author = {Jenny Tang and Léo Alvarez and Arjun Brar and Nguyen Phong Hoang and Nicolas Christin}, + title = {Automatic Generation of Web Censorship Probe Lists}, + journal = {Privacy Enhancing Technologies}, + volume = {2024}, + number = {4}, + publisher = {}, + year = {2024}, + url = {https://petsymposium.org/popets/2024/popets-2024-0106.pdf}, +} + @inproceedings{Ahmed2024a, author = {Mohamed Ahmed and Jeffrey Knockel}, title = {Extended Abstract: The Impact of Online Censorship on {LLMs}},