@inproceedings{ravi_knight_mtdec_acl11,
  author    = {Sujith Ravi and Kevin Knight},
  title     = {Deciphering Foreign Language},
  booktitle = {Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies (ACL-HLT)},
  year      = {2011},
  url       = {http://aclweb.org/anthology/P/P11/P11-1002.pdf},
  abstract  = {In this work, we tackle the task of machine translation (MT)
    without parallel training data. We frame the MT problem as a decipherment
    task, treating the foreign text as a cipher for English and present novel
    methods for training translation models from non-parallel text.}
}
@inproceedings{ravi_knight_bayesdec_acl11,
  author    = {Sujith Ravi and Kevin Knight},
  title     = {Bayesian Inference for {Zodiac} and Other Homophonic Ciphers},
  booktitle = {Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies (ACL-HLT)},
  year      = {2011},
  url       = {http://aclweb.org/anthology/P/P11/P11-1025.pdf},
  abstract  = {We introduce a novel Bayesian approach for deciphering complex substitution ciphers. Our method uses a decipherment model which combines information from letter n-gram language models as well as word dictionaries. Bayesian inference is performed on our model using an efficient sampling technique. We evaluate the quality of the Bayesian decipherment output on simple and homophonic letter substitution ciphers and show that unlike a previous approach, our method consistently produces almost 100\% accurate decipherments. The new method can be applied on more complex substitution ciphers and we demonstrate its utility by cracking the famous Zodiac-408 cipher in a fully automated fashion, which has never been done before.}
}
@inproceedings{srlccg_ijcnlp11,
  author    = {Stephen Boxwell and Chris Brew and Jason Baldridge and Dennis Mehay and Sujith Ravi},
  title     = {Semantic {Role} {Labeling} Without Treebanks},
  booktitle = {Proceedings of the International Joint Conference on Natural Language Processing (IJCNLP)},
  year      = {2011}
}
@inproceedings{kozareva-ravi_emnlp11_unsup-ws,
  author    = {Kozareva, Zornitsa and Ravi, Sujith},
  title     = {Unsupervised Name Ambiguity Resolution Using A Generative Model},
  booktitle = {Proceedings of the EMNLP Workshop on Unsupervised Learning in NLP},
  year      = {2011}
}
@inproceedings{ravi_et_al-coling10,
  author    = {Sujith Ravi and Ashish Vaswani and Kevin Knight and David Chiang},
  title     = {Fast, Greedy Model Minimization for Unsupervised Tagging},
  booktitle = {Proceedings of the 23rd International Conference on Computational Linguistics (COLING)},
  year      = {2010},
  pages     = {940--948},
  url       = {http://aclweb.org/anthology/C/C10/C10-1106.pdf},
  abstract  = {Model minimization has been shown to work well for the task of
    unsupervised part-of-speech tagging with a dictionary. In Ravi and Knight
    (2009), the authors invoke an integer programming (IP) solver to do model
    minimization. However, solving this problem exactly using an integer
    programming formulation is intractable for practical purposes. We propose
    a novel two-stage greedy approximation scheme to replace the IP. Our
    method runs fast, while yielding highly accurate tagging results. We also
    compare our method against standard EM training, and show that we
    consistently obtain better tagging accuracies on test data of varying
    sizes for English and Italian.}
}
@inproceedings{ravi:baldridge:knight-acl10,
  author    = {Sujith Ravi and Jason Baldridge and Kevin Knight},
  title     = {Minimized models and grammar-informed initialization for supertagging with highly ambiguous lexicons},
  booktitle = {Proceedings of the 48th Annual Meeting of the Association for Computational Linguistics (ACL)},
  year      = {2010},
  pages     = {495--503},
  url       = {http://www.aclweb.org/anthology/P10-1051.pdf},
  abstract  = {We combine two complementary ideas
    for learning supertaggers from highly ambiguous
    lexicons: grammar-informed tag
    transitions and models minimized via integer
    programming. Each strategy on its
    own greatly improves performance over
    basic expectation-maximization training
    with a bitag Hidden Markov Model, which
    we show on the CCGbank and CCG-TUT
    corpora. The strategies provide further error
    reductions when combined. We describe
    a new two-stage integer programming
    strategy that efficiently deals with
    the high degree of ambiguity on these
    datasets while obtaining the full effect of
    model minimization.}
}
@article{ravi:knight-compling09,
  author   = {Sujith Ravi and Kevin Knight},
  title    = {Does {GIZA}++ Make Search Errors?},
  journal  = {Computational Linguistics},
  volume   = {36},
  number   = {3},
  pages    = {295--302},
  year     = {2010},
  url      = {http://www.aclweb.org/anthology/J/J10/J10-3001.pdf},
  abstract = {Word alignment is a critical procedure within statistical
    machine translation (SMT). Brown et al. (1993) have provided the most
    popular word alignment algorithm to date, one that has been implemented
    in GIZA (Al-Onaizan et al. 1999) and GIZA++ (Och and Ney 2003) software
    and adopted by nearly every SMT project. In this paper, we investigate
    whether this algorithm makes search errors when it computes Viterbi
    alignments, i.e., whether it returns alignments that are sub-optimal
    according to a trained model.}
}
@incollection{kim:shaw:ravi-edm-book10,
  author    = {Jihie Kim and Erin Shaw and Sujith Ravi},
  title     = {Mining Student Discussions to Profile Participation and Scaffold Learning},
  booktitle = {The Handbook of Educational Data Mining},
  editor    = {Cristobal Romero and Sebastian Ventura and Mykola Pechenizkiy and Ryan Baker},
  publisher = {CRC Press},
  year      = {2010},
  pages     = {299--310}
}
@inproceedings{chiang_et_al-naacl10,
  author    = {David Chiang and Jonathan Graehl and Kevin Knight and Adam Pauls and Sujith Ravi},
  title     = {Bayesian Inference for Finite-State Transducers},
  booktitle = {Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics - Human Language Technologies (NAACL/HLT)},
  year      = {2010},
  pages     = {447--455},
  url       = {http://aclweb.org/anthology/N/N10/N10-1068.pdf},
  abstract  = {We describe a Bayesian inference algorithm
    that can be used to train any cascade of
    weighted finite-state transducers on end-to-end
    data. We also investigate the problem
    of automatically selecting from among multiple
    training runs. Our experiments on four
    different tasks demonstrate the genericity of
    this framework, and, where applicable, large
    improvements in performance over EM. We
    also show, for unsupervised part-of-speech
    tagging, that automatic run selection gives a
    large improvement over previous Bayesian approaches.}
}
@inproceedings{ravi_et_al-wsdm10,
  author    = {Sujith Ravi and Andrei Z. Broder and Evgeniy Gabrilovich and Vanja Josifovski and Sandeep Pandey and Bo Pang},
  title     = {Automatic generation of bid phrases for online advertising},
  booktitle = {Proceedings of the International Conference on Web Search and Data Mining (WSDM)},
  year      = {2010},
  pages     = {341--350},
  url       = {http://research.yahoo.com/files/wsdm246-ravi.pdf},
  abstract  = {One of the most prevalent online advertising methods is textual
    advertising. To produce a textual ad, an advertiser
    must craft a short creative (the text of the ad) linking to a
    landing page, which describes the product or service being
    promoted. Furthermore, the advertiser must associate the
    creative to a set of manually chosen bid phrases representing
    those Web search queries that should trigger the ad. For
    efficiency, given a landing page, the bid phrases are often
    chosen first, and then for each bid phrase the creative is
    produced using a template. Nevertheless, an ad campaign
    (e.g., for a large retailer) might involve thousands of landing
    pages and tens or hundreds of thousands of bid phrases,
    hence the entire process is very laborious. \\ \\
    Our study aims towards the automatic construction of online
    ad campaigns: given a landing page, we propose several
    algorithmic methods to generate bid phrases suitable for the
    given input. Such phrases must be both relevant (that is, reflect
    the content of the page) and well-formed (that is, likely
    to be used as queries to a Web search engine). To this end,
    we use a two phase approach. First, candidate bid phrases
    are generated by a number of methods, including a (monolingual)
    translation model capable of generating phrases not
    contained within the text of the input as well as previously
    ``unseen'' phrases. Second, the candidates are ranked in a
    probabilistic framework using both the translation model,
    which favors relevant phrases, as well as a bid phrase language
    model, which favors well-formed phrases. \\ \\
    Empirical evaluation based on a real-life corpus of advertiser-created
    landing pages and associated bid phrases confirms
    the value of our approach, which successfully re-generates
    many of the human-crafted bid phrases and performs significantly
    better than a pure text extraction method.}
}
@inproceedings{ravi:knight-acl09,
  author    = {Ravi, Sujith and Knight, Kevin},
  title     = {Minimized models for unsupervised part-of-speech tagging},
  booktitle = {Proceedings of the Joint Conference of the 47th Annual Meeting of the Association for Computational Linguistics and the 4th International Joint Conference on Natural Language Processing of the Asian Federation of Natural Language Processing (ACL-IJCNLP)},
  year      = {2009},
  pages     = {504--512},
  url       = {http://aclweb.org/anthology/P/P09/P09-1057.pdf},
  note      = {\textbf{Nominated for the Best Paper Award}},
  abstract  = {We describe a novel method for the task
    of unsupervised POS tagging with a dictionary,
    one that uses integer programming
    to explicitly search for the smallest model
    that explains the data, and then uses EM
    to set parameter values. We evaluate our
    method on a standard test corpus using
    different standard tagsets (a 45-tagset as
    well as a smaller 17-tagset), and show that
    our approach performs better than existing
    state-of-the-art systems in both settings.}
}
@inproceedings{bodrumlu:knight:ravi-naacl09_ilp-ws,
  author    = {Bodrumlu, Tugba and Knight, Kevin and Ravi, Sujith},
  title     = {A new objective function for word alignment},
  booktitle = {Proceedings of the NAACL/HLT Workshop on Integer Programming for Natural Language Processing},
  year      = {2009},
  pages     = {28--35},
  url       = {http://aclweb.org/anthology-new/W/W09/W09-1804.pdf},
  abstract  = {We develop a new objective function for word
    alignment that measures the size of the bilingual
    dictionary induced by an alignment. A
    word alignment that results in a small dictionary
    is preferred over one that results in a large
    dictionary. In order to search for the alignment
    that minimizes this objective, we cast the
    problem as an integer linear program. We then
    extend our objective function to align corpora
    at the sub-word level, which we demonstrate
    on a small Turkish-English corpus.}
}
@inproceedings{ravi:knight-naacl09,
  author    = {Ravi, Sujith and Knight, Kevin},
  title     = {Learning phoneme mappings for transliteration without parallel data},
  booktitle = {Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics - Human Language Technologies (NAACL/HLT)},
  year      = {2009},
  pages     = {37--45},
  url       = {http://aclweb.org/anthology/N/N09/N09-1005.pdf},
  abstract  = {We present a method for performing machine
    transliteration without any parallel resources.
    We frame the transliteration task as a decipherment
    problem and show that it is possible
    to learn cross-language phoneme mapping
    tables using only monolingual resources. We
    compare various methods and evaluate their
    accuracies on a standard name transliteration
    task.}
}
@inproceedings{ravi:knight-iccpol09,
  author    = {Sujith Ravi and Kevin Knight},
  title     = {Probabilistic Methods for a {Japanese} Syllable Cipher},
  booktitle = {Proceedings of the 22nd International Conference on the Computer Processing of Oriental Languages (ICCPOL)},
  year      = {2009},
  pages     = {270--281},
  url       = {http://www.springerlink.com/content/r7113hp62731745t/fulltext.pdf},
  abstract  = {This paper attacks a Japanese syllable-substitution cipher.
    We use a probabilistic, noisy-channel framework, exploiting various Japanese
    language models to drive the decipherment. We describe several
    innovations, including a new objective function for searching for the
    highest-scoring decipherment. We include empirical studies of the relevant phenomena,
    and we give improved decipherment accuracy rates.}
}
@article{ravi:knight-cryptologia09,
  author   = {Sujith Ravi and Kevin Knight},
  title    = {Attacking Letter Substitution Ciphers with Integer Programming},
  journal  = {Cryptologia},
  volume   = {33},
  number   = {4},
  year     = {2009},
  pages    = {321--334},
  doi      = {10.1080/01611190903030920},
  url      = {http://www.informaworld.com/10.1080/01611190903030920},
  abstract = {We introduce a method for solving substitution ciphers using low-order letter n-gram models. This method enforces global constraints using integer programming, and it guarantees that no decipherment key is overlooked. We carry out extensive empirical experiments showing how decipherment accuracy varies as a function of cipher length and n-gram order. We also make an empirical investigation of Shannon's (1949) theory of uncertainty in decipherment.}
}
@inproceedings{ravi:knight-emnlp08,
  author    = {Sujith Ravi and Kevin Knight},
  title     = {Attacking Decipherment Problems Optimally with Low-Order N-gram Models},
  booktitle = {Proceedings of Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  year      = {2008},
  pages     = {812--819},
  url       = {http://www.aclweb.org/anthology/D08-1085.pdf},
  abstract  = {We introduce a method for solving substitution
    ciphers using low-order letter n-gram
    models. This method enforces global constraints
    using integer programming, and it
    guarantees that no decipherment key is overlooked.
    We carry out extensive empirical experiments
    showing how decipherment accuracy
    varies as a function of cipher length and
    n-gram order. We also make an empirical investigation
    of Shannon's (1949) theory of uncertainty
    in decipherment.}
}
@inproceedings{ravi:knight:soricut-emnlp08,
  author    = {Sujith Ravi and Kevin Knight and Radu Soricut},
  title     = {Automatic Prediction of Parser Accuracy},
  booktitle = {Proceedings of Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  year      = {2008},
  pages     = {887--896},
  url       = {http://www.aclweb.org/anthology/D08-1093.pdf},
  abstract  = {Statistical parsers have become increasingly
    accurate, to the point where they are useful in
    many natural language applications. However,
    estimating parsing accuracy on a wide variety
    of domains and genres is still a challenge in
    the absence of gold-standard parse trees.
    In this paper, we propose a technique that automatically
    takes into account certain characteristics
    of the domains of interest, and accurately
    predicts parser performance on data
    from these new domains. As a result, we have
    a cheap (no annotation involved) and effective
    recipe for measuring the performance of a statistical
    parser on any given domain.}
}
@inproceedings{ravi:pasca-cikm08,
  author    = {Sujith Ravi and Marius Pasca},
  title     = {Using structured text for large-scale attribute extraction},
  booktitle = {Proceedings of the 17th ACM Conference on Information and Knowledge Management (CIKM)},
  year      = {2008},
  pages     = {1183--1192},
  url       = {http://dl.acm.org/citation.cfm?id=1458238},
  abstract  = {We propose a weakly-supervised approach for extracting
    class attributes from structured text available within Web
    documents. The overall precision of the extracted attributes
    is around 30\% higher than with previous methods operating
    on Web documents. In addition to attribute extraction, this
    approach also automatically identifies values for a subset of
    the extracted class attributes.}
}
@inproceedings{kim_et_al-its08,
  author    = {Jihie Kim and Erin Shaw and Sujith Ravi and Erin Tavano and Aniwat Arromratana and Pankaj Sarda},
  title     = {Scaffolding On-Line Discussions with Past Discussions: An Analysis and Pilot Study of {PedaBot}},
  booktitle = {Proceedings of the 9th International Conference on Intelligent Tutoring Systems (ITS)},
  year      = {2008},
  pages     = {343--352},
  url       = {http://www.springerlink.com/content/c0p21873t787q388/fulltext.pdf},
  abstract  = {PedaBot is a new discussion scaffolding application designed to aid
    student knowledge acquisition, promote reflection about course topics and
    encourage student participation in discussions. It dynamically processes student
    discussions and presents related discussions from a knowledge base of past
    discussions. This paper describes the system and presents a comparative
    analysis of the information retrieval techniques used to respond to free-form
    student discussions, a combination of topic profiling, term frequency-inverse
    document frequency, and latent semantic analysis. Responses are presented as
    annotated links that students can follow and rate. We report a pilot study of
    PedaBot based on student viewings, student ratings, and a small survey. Initial
    results indicate that there is a high level of student interest in the feature and
    that its responses are moderately relevant to student discussions.}
}
@inproceedings{ravi:kim-aied07a,
  author    = {Sujith Ravi and Jihie Kim},
  title     = {Profiling Student Interactions in Threaded Discussions with Speech Act Classifiers},
  booktitle = {Proceedings of the 13th International Conference on Artificial Intelligence in Education (AIED)},
  year      = {2007},
  pages     = {357--364},
  url       = {http://www.isi.edu/~jihie/papers/ThreadAssessmt-AIED2007.pdf},
  abstract  = {On-line discussion is a popular form of web-based computer-mediated
    communication and is an important medium for distance education. Automatic
    tools for analyzing online discussions are highly desirable for better information
    management and assistance. This paper presents an approach for automatically
    profiling student interactions in on-line discussions. Using N-gram features and
    linear SVM, we developed ``speech act'' classifiers that identify the roles that
    individual messages play. The classifiers were used in finding messages that
    contain questions or answers. We then applied a set of thread analysis rules for
    identifying threads that may have unanswered questions and need instructor
    attention. We evaluated the results with three human annotators, and 70-75\% of
    the predictions from the system were consistent with human answers.}
}
@inproceedings{ravi:kim:shaw-aied07b_edm-ws,
  author    = {Sujith Ravi and Jihie Kim and Erin Shaw},
  title     = {Mining On-line Discussions: Assessing Technical Quality for Student Scaffolding and Classifying Messages for Participation Profiling},
  booktitle = {Proceedings of the Educational Data Mining Workshop in the 13th International Conference on Artificial Intelligence in Education (AIED)},
  year      = {2007},
  abstract  = {On-line collaborative discussions play an important role in distance
    education and web-enhanced courses. Automatic tools for assessing student
    activities and promoting collaborative problem solving can provide a better
    learning experience for students and also offer useful assistance to teachers. This
    paper presents two novel instructional tools that apply data mining and
    information retrieval techniques. First, we describe an approach that could be
    used to scaffold undergraduate student discussions by retrieving useful
    information from past student discussions. The tool exploits both the discussions
    from the same undergraduate course and the ones from a graduate-level course.
    The second part of the paper presents an instructional tool that profiles student
    contributions with respect to student genders and the roles that students play in
    discussion. We apply speech act classifiers that automatically identify whether the
    given message contains questions and/or answers, and use the classification
    results in profiling male and female student contributions. Our initial evaluation
    of the scaffolding tool shows that discussions from the same course contain more
    number of similar concepts than the ones from the graduate-level course. However,
    technical quality of graduate-level discussions is higher. The results from the
    profiling tool indicate that female participation in undergraduate-level discussions
    is lower than that in graduate-level discussions, and graduate female students post
    more questions and answers compared to undergraduate female students.}
}
This file was generated by bibtex2html 1.96.