1 package FS::cust_main::Search;
4 use base qw( Exporter );
5 use vars qw( @EXPORT_OK $DEBUG $me $conf @fuzzyfields );
6 use String::Approx qw(amatch);
8 use FS::Record qw( qsearch );
10 use FS::cust_main_invoice;
13 @EXPORT_OK = qw( smart_search );
15 # 1 is mostly method/subroutine entry and options
16 # 2 traces progress of some operations
17 # 3 is even more information including possibly sensitive data
19 $me = '[FS::cust_main::Search]';
21 @fuzzyfields = ( 'first', 'last', 'company', 'address1' );
23 install_callback FS::UID sub {
25 #yes, need it for stuff below (probably should be cached)
30 FS::cust_main::Search - Customer searching
34 use FS::cust_main::Search;
36 FS::cust_main::Search::smart_search(%options);
38 FS::cust_main::Search::email_search(%options);
40 FS::cust_main::Search->search( \%options );
42 FS::cust_main::Search->fuzzy_search( \%fuzzy_hashref );
48 =item smart_search OPTION => VALUE ...
50 Accepts the following options: I<search>, the string to search for. The string
51 will be searched for as a customer number, phone number, name or company name,
52 as an exact, or, in some cases, a substring or fuzzy match (see the source code
53 for the exact heuristics used); I<no_fuzzy_on_exact>, causes smart_search to
54 skip fuzzy matching when an exact match is found.
56 Any additional options are treated as an additional qualifier on the search
59 Returns a (possibly empty) array of FS::cust_main objects.
66 #here is the agent virtualization
68 $FS::CurrentUser::CurrentUser->agentnums_sql(table => 'cust_main');
72 my $skip_fuzzy = delete $options{'no_fuzzy_on_exact'};
73 my $search = delete $options{'search'};
74 ( my $alphanum_search = $search ) =~ s/\W//g;
76 if ( $alphanum_search =~ /^1?(\d{3})(\d{3})(\d{4})(\d*)$/ ) { #phone# search
78 #false laziness w/Record::ut_phone
79 my $phonen = "$1-$2-$3";
80 $phonen .= " x$4" if $4;
82 push @cust_main, qsearch( {
83 'table' => 'cust_main',
84 'hashref' => { %options },
85 'extra_sql' => ( scalar(keys %options) ? ' AND ' : ' WHERE ' ).
87 join(' OR ', map "$_ = '$phonen'",
89 ship_daytime ship_night ship_fax )
92 " AND $agentnums_sql", #agent virtualization
95 unless ( @cust_main || $phonen =~ /x\d+$/ ) { #no exact match
96 #try looking for matches with extensions unless one was specified
98 push @cust_main, qsearch( {
99 'table' => 'cust_main',
100 'hashref' => { %options },
101 'extra_sql' => ( scalar(keys %options) ? ' AND ' : ' WHERE ' ).
103 join(' OR ', map "$_ LIKE '$phonen\%'",
105 ship_daytime ship_night )
108 " AND $agentnums_sql", #agent virtualization
113 # custnum search (also try agent_custid), with some tweaking options if your
114 # legacy cust "numbers" have letters
118 if ( $search =~ /@/ ) {
122 'table' => 'cust_main_invoice',
123 'hashref' => { 'dest' => $search },
126 } elsif ( $search =~ /^\s*(\d+)\s*$/
127 || ( $conf->config('cust_main-agent_custid-format') eq 'ww?d+'
128 && $search =~ /^\s*(\w\w?\d+)\s*$/
130 || ( $conf->config('cust_main-custnum-display_special')
131 # it's not currently possible for special prefixes to contain
132 # digits, so just strip off any alphabetic prefix and match
133 # the rest to custnum
134 && $search =~ /^\s*[[:alpha:]]*(\d+)\s*$/
136 || ( $conf->exists('address1-search' )
137 && $search =~ /^\s*(\d+\-?\w*)\s*$/ #i.e. 1234A or 9432-D
144 if ( $num =~ /^(\d+)$/ && $num <= 2147483647 ) { #need a bigint custnum? wow
145 push @cust_main, qsearch( {
146 'table' => 'cust_main',
147 'hashref' => { 'custnum' => $num, %options },
148 'extra_sql' => " AND $agentnums_sql", #agent virtualization
152 # for all agents this user can see, if any of them have custnum prefixes
153 # that match the search string, include customers that match the rest
154 # of the custnum and belong to that agent
155 foreach my $agentnum ( $FS::CurrentUser::CurrentUser->agentnums ) {
156 my $p = $conf->config('cust_main-custnum-display_prefix', $agentnum);
158 if ( $p eq substr($num, 0, length($p)) ) {
159 push @cust_main, qsearch( {
160 'table' => 'cust_main',
161 'hashref' => { 'custnum' => 0 + substr($num, length($p)),
162 'agentnum' => $agentnum,
169 push @cust_main, qsearch( {
170 'table' => 'cust_main',
171 'hashref' => { 'agent_custid' => $num, %options },
172 'extra_sql' => " AND $agentnums_sql", #agent virtualization
175 if ( $conf->exists('address1-search') ) {
176 my $len = length($num);
178 foreach my $prefix ( '', 'ship_' ) {
179 push @cust_main, qsearch( {
180 'table' => 'cust_main',
181 'hashref' => { %options, },
183 ( keys(%options) ? ' AND ' : ' WHERE ' ).
184 " LOWER(SUBSTRING(${prefix}address1 FROM 1 FOR $len)) = '$num' ".
185 " AND $agentnums_sql",
190 } elsif ( $search =~ /^\s*(\S.*\S)\s+\((.+), ([^,]+)\)\s*$/ ) {
192 my($company, $last, $first) = ( $1, $2, $3 );
194 # "Company (Last, First)"
195 #this is probably something a browser remembered,
196 #so just do an exact search (but case-insensitive, so USPS standardization
197 #doesn't throw a wrench in the works)
199 foreach my $prefix ( '', 'ship_' ) {
200 push @cust_main, qsearch( {
201 'table' => 'cust_main',
202 'hashref' => { %options },
204 ( keys(%options) ? ' AND ' : ' WHERE ' ).
206 " LOWER(${prefix}first) = ". dbh->quote(lc($first)),
207 " LOWER(${prefix}last) = ". dbh->quote(lc($last)),
208 " LOWER(${prefix}company) = ". dbh->quote(lc($company)),
214 } elsif ( $search =~ /^\s*(\S.*\S)\s*$/ ) { # value search
215 # try (ship_){last,company}
219 # # remove "(Last, First)" in "Company (Last, First)", otherwise the
220 # # full strings the browser remembers won't work
221 # $value =~ s/\([\w \,\.\-\']*\)$//; #false laziness w/Record::ut_name
223 use Lingua::EN::NameParse;
224 my $NameParse = new Lingua::EN::NameParse(
229 my($last, $first) = ( '', '' );
230 #maybe disable this too and just rely on NameParse?
231 if ( $value =~ /^(.+),\s*([^,]+)$/ ) { # Last, First
233 ($last, $first) = ( $1, $2 );
235 #} elsif ( $value =~ /^(.+)\s+(.+)$/ ) {
236 } elsif ( ! $NameParse->parse($value) ) {
238 my %name = $NameParse->components;
239 $first = $name{'given_name_1'} || $name{'initials_1'}; #wtf NameParse, Ed?
240 $last = $name{'surname_1'};
244 if ( $first && $last ) {
246 my($q_last, $q_first) = ( dbh->quote($last), dbh->quote($first) );
249 my $sql = scalar(keys %options) ? ' AND ' : ' WHERE ';
251 ( ( LOWER(last) = $q_last AND LOWER(first) = $q_first )
252 OR ( LOWER(ship_last) = $q_last AND LOWER(ship_first) = $q_first )
255 push @cust_main, qsearch( {
256 'table' => 'cust_main',
257 'hashref' => \%options,
258 'extra_sql' => "$sql AND $agentnums_sql", #agent virtualization
261 # or it may just be something that was typed in... (try that in a sec)
265 my $q_value = dbh->quote($value);
268 my $sql = scalar(keys %options) ? ' AND ' : ' WHERE ';
269 $sql .= " ( LOWER(last) = $q_value
270 OR LOWER(company) = $q_value
271 OR LOWER(ship_last) = $q_value
272 OR LOWER(ship_company) = $q_value
274 $sql .= " OR LOWER(address1) = $q_value
275 OR LOWER(ship_address1) = $q_value
277 if $conf->exists('address1-search');
280 push @cust_main, qsearch( {
281 'table' => 'cust_main',
282 'hashref' => \%options,
283 'extra_sql' => "$sql AND $agentnums_sql", #agent virtualization
286 #no exact match, trying substring/fuzzy
287 #always do substring & fuzzy (unless they're explicitly config'ed off)
288 #(we were getting complaints that searches were not returning enough)
289 unless ( @cust_main && $skip_fuzzy || $conf->exists('disable-fuzzy') ) {
291 #still some false laziness w/search (was search/cust_main.cgi)
296 { 'company' => { op=>'ILIKE', value=>"%$value%" }, },
297 { 'ship_company' => { op=>'ILIKE', value=>"%$value%" }, },
300 if ( $first && $last ) {
303 { 'first' => { op=>'ILIKE', value=>"%$first%" },
304 'last' => { op=>'ILIKE', value=>"%$last%" },
306 { 'ship_first' => { op=>'ILIKE', value=>"%$first%" },
307 'ship_last' => { op=>'ILIKE', value=>"%$last%" },
314 { 'last' => { op=>'ILIKE', value=>"%$value%" }, },
315 { 'ship_last' => { op=>'ILIKE', value=>"%$value%" }, },
319 if ( $conf->exists('address1-search') ) {
321 { 'address1' => { op=>'ILIKE', value=>"%$value%" }, },
322 { 'ship_address1' => { op=>'ILIKE', value=>"%$value%" }, },
326 foreach my $hashref ( @hashrefs ) {
328 push @cust_main, qsearch( {
329 'table' => 'cust_main',
330 'hashref' => { %$hashref,
333 'extra_sql' => " AND $agentnums_sql", #agent virtualization
342 " AND $agentnums_sql", #extra_sql #agent virtualization
345 if ( $first && $last ) {
346 push @cust_main, FS::cust_main::Search->fuzzy_search(
347 { 'last' => $last, #fuzzy hashref
348 'first' => $first }, #
352 foreach my $field ( 'last', 'company' ) {
354 FS::cust_main::Search->fuzzy_search( { $field => $value }, @fuzopts );
356 if ( $conf->exists('address1-search') ) {
358 FS::cust_main::Search->fuzzy_search( { 'address1' => $value }, @fuzopts );
365 #eliminate duplicates
367 @cust_main = grep { !$saw{$_->custnum}++ } @cust_main;
375 Accepts the following options: I<email>, the email address to search for. The
376 email address will be searched for as an email invoice destination and as an
379 #Any additional options are treated as an additional qualifier on the search
382 Returns a (possibly empty) array of FS::cust_main objects (but usually just
392 my $email = delete $options{'email'};
394 #we're only being used by RT at the moment... no agent virtualization yet
395 #my $agentnums_sql = $FS::CurrentUser::CurrentUser->agentnums_sql;
399 if ( $email =~ /([^@]+)\@([^@]+)/ ) {
401 my ( $user, $domain ) = ( $1, $2 );
403 warn "$me smart_search: searching for $user in domain $domain"
409 'table' => 'cust_main_invoice',
410 'hashref' => { 'dest' => $email },
417 map $_->cust_svc->cust_pkg,
419 'table' => 'svc_acct',
420 'hashref' => { 'username' => $user, },
422 'AND ( SELECT domain FROM svc_domain
423 WHERE svc_acct.domsvc = svc_domain.svcnum
424 ) = '. dbh->quote($domain),
430 @cust_main = grep { !$saw{$_->custnum}++ } @cust_main;
432 warn "$me smart_search: found ". scalar(@cust_main). " unique customers"
449 Returns a qsearch hash expression to search for parameters specified in
450 HASHREF. Valid parameters are
468 listref of start date, end date
478 =item current_balance
480 listref (list returned by FS::UI::Web::parse_lt_gt($cgi, 'current_balance'))
493 my ($class, $params) = @_;
500 # initialize these to prevent warnings
507 'paydate_year' => '',
508 'invoice_terms' => '',
514 # explicit custnum(s)
517 if ( $params->{'custnum'} ) {
518 my @custnums = ref($params->{'custnum'}) ?
519 @{ $params->{'custnum'} } :
520 $params->{'custnum'};
522 'cust_main.custnum IN (' .
523 join(',', map { $_ =~ /^(\d+)$/ ? $1 : () } @custnums ) .
524 ')' if scalar(@custnums) > 0;
531 if ( $params->{'agentnum'} =~ /^(\d+)$/ and $1 ) {
533 "cust_main.agentnum = $1";
537 # do the same for user
540 if ( $params->{'usernum'} =~ /^(\d+)$/ and $1 ) {
542 "cust_main.usernum = $1";
549 #prospect ordered active inactive suspended cancelled
550 if ( grep { $params->{'status'} eq $_ } FS::cust_main->statuses() ) {
551 my $method = $params->{'status'}. '_sql';
552 #push @where, $class->$method();
553 push @where, FS::cust_main->$method();
559 if ( $params->{'address'} =~ /\S/ ) {
560 my $address = dbh->quote('%'. lc($params->{'address'}). '%');
561 push @where, '('. join(' OR ',
562 map "LOWER($_) LIKE $address",
563 qw(address1 address2 ship_address1 ship_address2)
571 if ( $params->{'refnum'} =~ /^(\d+)$/ ) {
572 push @where, "refnum = $1";
576 # parse cancelled package checkbox
581 $pkgwhere .= "AND (cancel = 0 or cancel is null)"
582 unless $params->{'cancelled_pkgs'};
585 # parse without census tract checkbox
588 push @where, "(censustract = '' or censustract is null)"
589 if $params->{'no_censustract'};
592 # parse with hardcoded tax location checkbox
595 push @where, "geocode is not null"
596 if $params->{'with_geocode'};
602 foreach my $field (qw( signupdate )) {
604 next unless exists($params->{$field});
606 my($beginning, $ending, $hour) = @{$params->{$field}};
609 "cust_main.$field IS NOT NULL",
610 "cust_main.$field >= $beginning",
611 "cust_main.$field <= $ending";
614 if ($dbh->{Driver}->{Name} =~ /Pg/i) {
615 push @where, "extract(hour from to_timestamp(cust_main.$field)) = $hour";
617 elsif( $dbh->{Driver}->{Name} =~ /mysql/i) {
618 push @where, "hour(from_unixtime(cust_main.$field)) = $hour"
621 warn "search by time of day not supported on ".$dbh->{Driver}->{Name}." databases";
625 $orderby ||= "ORDER BY cust_main.$field";
633 if ( $params->{'classnum'} ) {
635 my @classnum = ref( $params->{'classnum'} )
636 ? @{ $params->{'classnum'} }
637 : ( $params->{'classnum'} );
639 @classnum = grep /^(\d*)$/, @classnum;
642 push @where, '( '. join(' OR ', map {
643 $_ ? "cust_main.classnum = $_"
644 : "cust_main.classnum IS NULL"
657 if ( $params->{'payby'} ) {
659 my @payby = ref( $params->{'payby'} )
660 ? @{ $params->{'payby'} }
661 : ( $params->{'payby'} );
663 @payby = grep /^([A-Z]{4})$/, @payby;
665 push @where, '( '. join(' OR ', map "cust_main.payby = '$_'", @payby). ' )'
671 # paydate_year / paydate_month
674 if ( $params->{'paydate_year'} =~ /^(\d{4})$/ ) {
676 $params->{'paydate_month'} =~ /^(\d\d?)$/
677 or die "paydate_year without paydate_month?";
681 'paydate IS NOT NULL',
683 "CAST(paydate AS timestamp) < CAST('$year-$month-01' AS timestamp )"
691 if ( $params->{'invoice_terms'} =~ /^([\w ]+)$/ ) {
693 if ( $1 eq 'NULL' ) {
695 "( cust_main.invoice_terms IS NULL OR cust_main.invoice_terms = '' )";
698 "cust_main.invoice_terms IS NOT NULL",
699 "cust_main.invoice_terms = '$1'";
707 if ( $params->{'current_balance'} ) {
709 #my $balance_sql = $class->balance_sql();
710 my $balance_sql = FS::cust_main->balance_sql();
712 my @current_balance =
713 ref( $params->{'current_balance'} )
714 ? @{ $params->{'current_balance'} }
715 : ( $params->{'current_balance'} );
717 push @where, map { s/current_balance/$balance_sql/; $_ }
726 if ( $params->{'custbatch'} =~ /^([\w\/\-\:\.]+)$/ and $1 ) {
728 "cust_main.custbatch = '$1'";
731 if ( $params->{'tagnum'} ) {
732 my @tagnums = ref( $params->{'tagnum'} ) ? @{ $params->{'tagnum'} } : ( $params->{'tagnum'} );
734 @tagnums = grep /^(\d+)$/, @tagnums;
737 my $tags_where = "0 < (select count(1) from cust_tag where "
738 . " cust_tag.custnum = cust_main.custnum and tagnum in ("
739 . join(',', @tagnums) . "))";
741 push @where, $tags_where;
747 # setup queries, subs, etc. for the search
750 $orderby ||= 'ORDER BY custnum';
752 # here is the agent virtualization
754 $FS::CurrentUser::CurrentUser->agentnums_sql(table => 'cust_main');
756 my $extra_sql = scalar(@where) ? ' WHERE '. join(' AND ', @where) : '';
760 my $count_query = "SELECT COUNT(*) FROM cust_main $extra_sql";
764 FS::UI::Web::cust_sql_fields($params->{'cust_fields'}),
767 my(@extra_headers) = ();
768 my(@extra_fields) = ();
770 if ($params->{'flattened_pkgs'}) {
774 if ($dbh->{Driver}->{Name} eq 'Pg') {
776 push @select, "array_to_string(array(select pkg from cust_pkg left join part_pkg using ( pkgpart ) where cust_main.custnum = cust_pkg.custnum $pkgwhere),'|') as magic";
778 } elsif ($dbh->{Driver}->{Name} =~ /^mysql/i) {
779 push @select, "GROUP_CONCAT(part_pkg.pkg SEPARATOR '|') as magic";
780 $addl_from .= ' LEFT JOIN cust_pkg USING ( custnum ) '; #Pg too w/flatpkg?
781 $addl_from .= ' LEFT JOIN part_pkg USING ( pkgpart ) ';
782 #$pkg_join .= ' LEFT JOIN part_pkg USING ( pkgpart ) ';
784 warn "warning: unknown database type ". $dbh->{Driver}->{Name}.
785 "omitting packing information from report.";
788 my $header_query = "SELECT COUNT(cust_pkg.custnum = cust_main.custnum) AS count FROM cust_main $addl_from $extra_sql $pkgwhere group by cust_main.custnum order by count desc limit 1";
790 my $sth = dbh->prepare($header_query) or die dbh->errstr;
791 $sth->execute() or die $sth->errstr;
792 my $headerrow = $sth->fetchrow_arrayref;
793 my $headercount = $headerrow ? $headerrow->[0] : 0;
794 while($headercount) {
795 unshift @extra_headers, "Package ". $headercount;
796 unshift @extra_fields, eval q!sub {my $c = shift;
797 my @a = split '\|', $c->magic;
798 my $p = $a[!.--$headercount. q!];
805 if ( $params->{'with_geocode'} ) {
807 unshift @extra_headers, 'Tax location override', 'Calculated tax location';
808 unshift @extra_fields, sub { my $c = shift; $c->get('geocode'); },
810 $c->set('geocode', '');
811 $c->geocode('cch'); #XXX only cch right now
813 push @select, 'geocode';
814 push @select, 'zip' unless grep { $_ eq 'zip' } @select;
815 push @select, 'ship_zip' unless grep { $_ eq 'ship_zip' } @select;
818 my $select = join(', ', @select);
821 'table' => 'cust_main',
823 'addl_from' => $addl_from,
825 'extra_sql' => $extra_sql,
826 'order_by' => $orderby,
827 'count_query' => $count_query,
828 'extra_headers' => \@extra_headers,
829 'extra_fields' => \@extra_fields,
834 =item fuzzy_search FUZZY_HASHREF [ HASHREF, SELECT, EXTRA_SQL, CACHE_OBJ ]
836 Performs a fuzzy (approximate) search and returns the matching FS::cust_main
837 records. Currently, I<first>, I<last>, I<company> and/or I<address1> may be
838 specified (the appropriate ship_ field is also searched).
840 Additional options are the same as FS::Record::qsearch
845 my( $self, $fuzzy, $hash, @opt) = @_;
850 check_and_rebuild_fuzzyfiles();
851 foreach my $field ( keys %$fuzzy ) {
853 my $all = $self->all_X($field);
854 next unless scalar(@$all);
857 $match{$_}=1 foreach ( amatch( $fuzzy->{$field}, ['i'], @$all ) );
860 foreach ( keys %match ) {
861 push @fcust, qsearch('cust_main', { %$hash, $field=>$_}, @opt);
862 push @fcust, qsearch('cust_main', { %$hash, "ship_$field"=>$_}, @opt);
865 push @cust_main, grep { ! $fsaw{$_->custnum}++ } @fcust;
868 # we want the components of $fuzzy ANDed, not ORed, but still don't want dupes
870 @cust_main = grep { ++$saw{$_->custnum} == scalar(keys %$fuzzy) } @cust_main;
878 =head1 UTILITY SUBROUTINES
882 =item check_and_rebuild_fuzzyfiles
886 sub check_and_rebuild_fuzzyfiles {
887 my $dir = $FS::UID::conf_dir. "/cache.". $FS::UID::datasrc;
888 rebuild_fuzzyfiles() if grep { ! -e "$dir/cust_main.$_" } @fuzzyfields;
891 =item rebuild_fuzzyfiles
895 sub rebuild_fuzzyfiles {
897 use Fcntl qw(:flock);
899 my $dir = $FS::UID::conf_dir. "/cache.". $FS::UID::datasrc;
900 mkdir $dir, 0700 unless -d $dir;
902 foreach my $fuzzy ( @fuzzyfields ) {
904 open(LOCK,">>$dir/cust_main.$fuzzy")
905 or die "can't open $dir/cust_main.$fuzzy: $!";
907 or die "can't lock $dir/cust_main.$fuzzy: $!";
909 open (CACHE, '>:encoding(UTF-8)', "$dir/cust_main.$fuzzy.tmp")
910 or die "can't open $dir/cust_main.$fuzzy.tmp: $!";
912 foreach my $field ( $fuzzy, "ship_$fuzzy" ) {
913 my $sth = dbh->prepare("SELECT $field FROM cust_main".
914 " WHERE $field != '' AND $field IS NOT NULL");
915 $sth->execute or die $sth->errstr;
917 while ( my $row = $sth->fetchrow_arrayref ) {
918 print CACHE $row->[0]. "\n";
923 close CACHE or die "can't close $dir/cust_main.$fuzzy.tmp: $!";
925 rename "$dir/cust_main.$fuzzy.tmp", "$dir/cust_main.$fuzzy";
931 =item append_fuzzyfiles FIRSTNAME LASTNAME COMPANY ADDRESS1
935 sub append_fuzzyfiles {
936 #my( $first, $last, $company ) = @_;
938 check_and_rebuild_fuzzyfiles();
940 use Fcntl qw(:flock);
942 my $dir = $FS::UID::conf_dir. "/cache.". $FS::UID::datasrc;
944 foreach my $field (@fuzzyfields) {
949 open(CACHE, '>>:encoding(UTF-8)', "$dir/cust_main.$field" )
950 or die "can't open $dir/cust_main.$field: $!";
952 or die "can't lock $dir/cust_main.$field: $!";
954 print CACHE "$value\n";
957 or die "can't unlock $dir/cust_main.$field: $!";
971 my( $self, $field ) = @_;
972 my $dir = $FS::UID::conf_dir. "/cache.". $FS::UID::datasrc;
973 open(CACHE, '<:encoding(UTF-8)', "$dir/cust_main.$field")
974 or die "can't open $dir/cust_main.$field: $!";
975 my @array = map { chomp; $_; } <CACHE>;
986 L<FS::cust_main>, L<FS::Record>