package KinoSearch::Analysis::Tokenizer;
use KinoSearch;
1;
__END__
__BINDING__
# Sample code for the synopsis documentation; handed to register() below
# through make_pod => { synopsis => ... }.  The heredoc is single-quoted so
# the backslashes in the regex patterns are kept literally.
my $synopsis = <<'END_SYNOPSIS';
my $whitespace_tokenizer
= KinoSearch::Analysis::Tokenizer->new( pattern => '\S+' );
# or...
my $word_char_tokenizer
= KinoSearch::Analysis::Tokenizer->new( pattern => '\w+' );
# or...
my $apostrophising_tokenizer = KinoSearch::Analysis::Tokenizer->new;
# Then... once you have a tokenizer, put it into a PolyAnalyzer:
my $polyanalyzer = KinoSearch::Analysis::PolyAnalyzer->new(
analyzers => [ $case_folder, $word_char_tokenizer, $stemmer ], );
END_SYNOPSIS

# Sample code for the constructor documentation; handed to register() below
# through make_pod => { constructor => { sample => ... } }.  `pattern` is
# marked optional because the synopsis above constructs a Tokenizer with no
# arguments at all.
my $constructor = <<'END_CONSTRUCTOR';
my $word_char_tokenizer = KinoSearch::Analysis::Tokenizer->new(
pattern => '\w+', # optional
);
END_CONSTRUCTOR

# Register the binding specification for KinoSearch::Analysis::Tokenizer:
# which methods and constructors to bind, plus the documentation samples
# defined above.
Clownfish::Binding::Perl::Class->register(
    parcel            => "KinoSearch",
    class_name        => "KinoSearch::Analysis::Tokenizer",
    bind_methods      => [qw( Set_Token_RE )],
    bind_constructors => ["_new"],
    make_pod          => {
        constructor => { sample => $constructor },
        synopsis    => $synopsis,
    },
);
__COPYRIGHT__
Copyright 2005-2010 Marvin Humphrey
This program is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.