package KinoSearch::Analysis::LCNormalizer; use strict; use warnings; use KinoSearch::Util::ToolSet; use base qw( KinoSearch::Analysis::Analyzer ); use locale; BEGIN { __PACKAGE__->init_instance_vars(); } sub analyze { my ( $self, $batch ) = @_; # lc all of the terms, one by one while ( $batch->next ) { $batch->set_text( lc( $batch->get_text ) ); } $batch->reset; return $batch; } 1; __END__ =head1 NAME KinoSearch::Analysis::LCNormalizer - convert input to lower case =head1 SYNOPSIS my $lc_normalizer = KinoSearch::Analysis::LCNormalizer->new; my $polyanalyzer = KinoSearch::Analysis::PolyAnalyzer->new( analyzers => [ $lc_normalizer, $tokenizer, $stemmer ], ); =head1 DESCRIPTION This class basically says C in a longwinded way which KinoSearch's Analysis apparatus can understand. =head1 CONSTRUCTOR =head2 new Construct a new LCNormalizer. Takes one labeled parameter, C, though it's a no-op for now. =head1 COPYRIGHT Copyright 2005-2006 Marvin Humphrey =head1 LICENSE, DISCLAIMER, BUGS, etc. See L version 0.15. =cut