query("SET NAMES 'utf8';");
    return $db;
}

// --------------------------------------------------------------------------- //
// println
// --------------------------------------------------------------------------- //
/**
 * Prints a string followed by a line break.
 *
 * @param string $ln Text to output; defaults to the empty string.
 */
function println($ln = '')
{
    print $ln.'
';
}

// --------------------------------------------------------------------------- //
// debugln
// --------------------------------------------------------------------------- //
// debugln() is declared conditionally; this first variant is the one declared
// when the DEBUG constant is truthy.
if (DEBUG) {
    /**
     * Debug variant: prints the message followed by a line break.
     *
     * @param string $ln Message to output; defaults to the empty string.
     */
    function debugln($ln = '')
    {
        print $ln.'
';
    }
} else if (LOCAL) {
    /** Variant declared when LOCAL is truthy: the message is discarded. */
    function debugln($ln = '') {}
} else {
    /** Default variant: does nothing (the file-logging code is commented out). */
    function debugln($ln = '')
    {
        /*
        $fp = fopen(LOG_PATH.'/recherchesDebug.log', 'a');
        fwrite($fp, $ln."\n");
        fclose($fp);
        */
    }
}

// --------------------------------------------------------------------------- //
// New sequence
// --------------------------------------------------------------------------- //
/**
 * Returns the list of combinations to try next for a given criteria string.
 *
 * The table is scanned in order; the first row whose 'crit' string contains
 * $criteres (substring test via strstr) wins, and its 'next' string is cut
 * into 3-character chunks with str_split(). The chunks therefore keep their
 * trailing space or suffix letter ('o' / 'p').
 *
 * NOTE(review): the 'crit' keys look like fixed-width, position-encoded
 * strings whose padding may have been collapsed in this copy of the file;
 * confirm against the original before relying on the table.
 *
 * @param string $criteres Criteria string to look up (taken by reference but
 *                         not modified here).
 * @return array 3-character chunks of the matching 'next' string, or an
 *               empty array when no row matches.
 */
function nouvelleSequence(&$criteres)
{
    $sequence = array(
        array('crit' => 'IT ', 'next' => '12'),
        array('crit' => 'I ', 'next' => '00'),
        array('crit' => 'I SEP ', 'next' => '12'),
        array('crit' => ' T ', 'next' => '00'),
        array('crit' => ' TSEP ', 'next' => '13 61 61o61p'),
        array('crit' => ' D VNR', 'next' => '24 45o24o24p'),
        array('crit' => ' D NR', 'next' => '21o21p'),
        array('crit' => ' DL NR', 'next' => '21 21o21p'),
        array('crit' => ' DLVNR', 'next' => '36 45 24 45o24o24p'),
        array('crit' => ' P VNR', 'next' => '74 78o74o74p'),
        array('crit' => ' PD VNR', 'next' => '74 78o74o74p'),
        array('crit' => ' PDL NR', 'next' => '78 83o74 74o74p'),
        array('crit' => ' PDLV R', 'next' => '78 81 82 77 71'),
        array('crit' => ' PDLVN ', 'next' => '82 75 28 71'),
        array('crit' => ' PDLVNR', 'next' => '78 74 82 78o74o82o82p'),
        array('crit' => ' S ', 'next' => '30o30p'),
        array('crit' => ' S R', 'next' => '72o71 71o71p'),
        array('crit' => ' S N ', 'next' => '31'),
        array('crit' => ' S NR', 'next' => '77 43 71'),
        array('crit' => ' S V ', 'next' => '35o35p30'),
        array('crit' => ' S VN ', 'next' => '75 77o75o77p75p'),
        array('crit' => ' S V R', 'next' => '75 83'),
        array('crit' => ' S VNR', 'next' => '43 44 75 83 61 71'),
        array('crit' => ' S D ', 'next' => '40p40o61p61'),
        array('crit' => ' S D R', 'next' => '45o77 77o77p'),
        array('crit' => ' S D N ', 'next' => '71'),
        array('crit' => ' S D NR', 'next' => '77 43 71 31'),
        array('crit' => ' S D V ', 'next' => '77o40 40o'),
        array('crit' => ' S D V R', 'next' => '75 72 71'),
        array('crit' => ' S D VN ', 'next' => '43 41 77 71'),
        array('crit' => ' S D VNR', 'next' => '44 43 49 73 75 72 71'),
        array('crit' => ' S DL ', 'next' => '78 78p61p61p'),
        array('crit' => ' S DL R', 'next' => '82 78 77 71'),
        array('crit' => ' S DL N ', 'next' => '41 71'),
        array('crit' => ' S DL NR', 'next' => '78 82 81 78p77 43 71 31'),
        array('crit' => ' S DLV ', 'next' => '78 78p71'),
        array('crit' => ' S DLV R', 'next' => '78 83 82 75 72 40 71'),
        array('crit' => ' S DLVN ', 'next' => '78 82 78p43 71'),
        array('crit' => ' S DLVNR', 'next' => '78 49 77 43 78p75 41 72 71 22'),
        array('crit' => ' S P ', 'next' => '60o60p31 31o31p'),
        array('crit' => ' S P R', 'next' => '45 77 41'),
        array('crit' => ' S P N ', 'next' => '71 71o45 45p'),
        array('crit' => ' S P NR', 'next' => '77 72 33 32'),
        array('crit' => ' S P V ', 'next' => '63o45 45o45p'),
        array('crit' => ' S P VN ', 'next' => '45 43 61 64'),
        array('crit' => ' S P V R', 'next' => '75 83 45 35'),
        array('crit' => ' S P VNR', 'next' => '77 45 44 43 73 75 72 71 41 42 40'),
        array('crit' => ' S PD ', 'next' => '45 71p71o'),
        array('crit' => ' S PD R', 'next' => '77 45 71'),
        array('crit' => ' S PD N ', 'next' => '71 71o45 45o'),
        array('crit' => ' S PD NR', 'next' => '77 76 45 41 43 40'),
        array('crit' => ' S PD V ', 'next' => '45 45o71 42 42p'),
        array('crit' => ' S PD V R', 'next' => '77 83 43 71 41'),
        array('crit' => ' S PD VN ', 'next' => '83 75 71 44 83o75o71o44o43 41 40 40o40p'),
        array('crit' => ' S PD VNR', 'next' => '77 74 45 44 43 75 71 61 63 60 40'),
        array('crit' => ' S PDL ', 'next' => '71 71o71p45 45o'),
        array('crit' => ' S PDL R', 'next' => '78 82 75 45 44'),
        array('crit' => ' S PDL N ', 'next' => '73 48 41'),
        array('crit' => ' S PDL NR', 'next' => '78 82 81 49 77 65 44 43 75 60 31'),
        array('crit' => ' S PDLV ', 'next' => '78 45 45o71 42 42p40'),
        array('crit' => ' S PDLV R', 'next' => '78 83 82 75 45 49 46 42 71 40'),
        array('crit' => ' S PDLVN ', 'next' => '78 83 77 45 71 42 41 40'),
        // NOTE(review): the key below contains a line break in this copy of
        // the file - presumably a wrapping artifact; confirm and repair.
        array('crit' => ' S 
PDLVNR', 'next' => '78 83 27 74 45 44 43 42 40'),
        array('crit' => ' SE ', 'next' => '31o31p'),
        array('crit' => ' SE R', 'next' => '72o71 71o71p'),
        array('crit' => ' SE N ', 'next' => '31'),
        array('crit' => ' SE NR', 'next' => '77 43 71'),
        array('crit' => ' SE V ', 'next' => '35o35p30'),
        array('crit' => ' SE V R', 'next' => '75 83'),
        array('crit' => ' SE VN ', 'next' => '75 77'),
        array('crit' => ' SE VNR', 'next' => '43 44 75 83 61 71'),
        array('crit' => ' SE D ', 'next' => '40o30'),
        array('crit' => ' SE D R', 'next' => '45o77'),
        array('crit' => ' SE D N ', 'next' => '71'),
        array('crit' => ' SE D NR', 'next' => '77 43 71 31'),
        array('crit' => ' SE D V ', 'next' => '77o40'),
        array('crit' => ' SE D V R', 'next' => '75 72 71'),
        array('crit' => ' SE D VN ', 'next' => '43 41 77'),
        array('crit' => ' SE D VNR', 'next' => '44 43 49 73 75 72 71'),
        array('crit' => ' SE DL ', 'next' => '40'),
        array('crit' => ' SE DL R', 'next' => '82 78 77'),
        array('crit' => ' SE DL N ', 'next' => '45 43 82o45o43o43p'),
        array('crit' => ' SE DL NR', 'next' => '78 82 81 46 77 43 71 31'),
        array('crit' => ' SE DLV ', 'next' => '78 78o71 71o71p'),
        array('crit' => ' SE DLV R', 'next' => '78 83 82 75 72 40'),
        array('crit' => ' SE DLVN ', 'next' => '78 82 46 43 71'),
        array('crit' => ' SE DLVNR', 'next' => '78 49 77 43 46 75 41 72 71 22'),
        array('crit' => ' SEP ', 'next' => '61p31 31p30'),
        array('crit' => ' SEP R', 'next' => '45 77 41'),
        array('crit' => ' SEP N ', 'next' => '71 71o45 45p'),
        array('crit' => ' SEP NR', 'next' => '77 72 33 32'),
        array('crit' => ' SEP V ', 'next' => '63o45'),
        array('crit' => ' SEP V R', 'next' => '75 83 45 35'),
        array('crit' => ' SEP VN ', 'next' => '45 43 61 64'),
        array('crit' => ' SEP VNR', 'next' => '77 45 44 43 73 75 72 71 41 42 40'),
        array('crit' => ' SEPD ', 'next' => '45 71p'),
        array('crit' => ' SEPD R', 'next' => '77 45'),
        array('crit' => ' SEPD N ', 'next' => '71 71o45 40'),
        // NOTE(review): same remark - this key contains a line break.
        array('crit' => ' 
SEPD NR', 'next' => '77 76 45 41 43 40'),
        array('crit' => ' SEPD V ', 'next' => '45 71p71o40'),
        array('crit' => ' SEPD V R', 'next' => '77 83 43 71 41 40'),
        array('crit' => ' SEPD VN ', 'next' => '83 75 71 44 83o75o71o44o43 41 40 40o40p'),
        array('crit' => ' SEPD VNR', 'next' => '77 74 45 44 43 75 71 61 63 60 40'),
        array('crit' => ' SEPDL ', 'next' => '45 71p40'),
        array('crit' => ' SEPDL R', 'next' => '78 82 75 45 44 40'),
        array('crit' => ' SEPDL N ', 'next' => '73 48 41 40'),
        array('crit' => ' SEPDL NR', 'next' => '78 82 81 49 77 65 44 43 75 60 31'),
        array('crit' => ' SEPDLV ', 'next' => '78 45 45o71 42 42p'),
        array('crit' => ' SEPDLV R', 'next' => '78 83 82 75 45 49 46 42 71 40'),
        array('crit' => ' SEPDLVN ', 'next' => '78 83 77 45 71 42 41 40'),
        array('crit' => ' SEPDLVNR', 'next' => '78 83 27 74 45 44 43 42 40'),
    );
    foreach ($sequence as $ligne) {
        // First row whose key contains the criteria string wins.
        if (strstr($ligne['crit'], $criteres) != false) {
            return str_split($ligne['next'], 3);
        }
    }
    return array();
}

// --------------------------------------------------------------------------- //
// New combination
// --------------------------------------------------------------------------- //
/**
 * Returns the next usable combination from $sequence, advancing $sequencePos.
 *
 * Entries are trimmed before use. A 2-character entry is returned as is. A
 * 3-character entry carries a suffix: it is skipped when $pass is 2 or 3;
 * otherwise 'p' selects index 'ent_phx' with SPH_MATCH_EXTENDED2 and 'o'
 * selects 'ent_mns' with SPH_MATCH_ISPELL, except that with
 * SPHINX_ENT_VERSION == 2 an 'o' entry is returned without its suffix and
 * without touching $index/$mode. Entries of any other length reset $index
 * when $pass is 1.
 *
 * @param array  $sequence    Chunks as produced by nouvelleSequence().
 * @param int    $sequencePos Current position; incremented for each entry read.
 * @param int    $pass        Current search pass.
 * @param string $index       Sphinx index name; may be overwritten.
 * @param mixed  $mode        Sphinx match mode; may be overwritten.
 * @return string The combination, or '' once the sequence is exhausted.
 */
function nouvelleCombinaison(&$sequence, &$sequencePos, $pass, &$index, &$mode)
{
    for (;;) {
        if (isset($sequence[$sequencePos]) === false) {
            return '';
        }
        $combinaison = trim($sequence[$sequencePos]);
        ++$sequencePos;
        if (strlen($combinaison) == 2) {
            return $combinaison;
        }
        // Switch to phonetic or orthographic matching
        if (strlen($combinaison) == 3) {
            if ($pass == 2 || $pass == 3) {
                continue;
            }
            $car = strtolower(substr($combinaison, 2, 1));
            // Search engine version 2: the orthographic variant is dropped
            if (SPHINX_ENT_VERSION == 2 && $car == 'o') {
                return strtolower(substr($combinaison, 0, 2));
            }
            switch($car) {
                case 'p':
                    $index = 'ent_phx';
                    $mode = SPH_MATCH_EXTENDED2;
                    break;
                case 'o':
                    $index = 'ent_mns';
                    $mode = SPH_MATCH_ISPELL;
                    break;
                default:
                    debugln("attention: mode inconnu: '$car'");
            }
        } else if ($pass == 1)
{
            $index = 'ent_mns';
            // Search engine version 2: the orthographic variant is dropped
            if (SPHINX_ENT_VERSION == 2) {
                $index = 'ent';
            }
        }
        return $combinaison;
    }
}

// --------------------------------------------------------------------------- //
// New criteria
// --------------------------------------------------------------------------- //
/**
 * Looks up the criteria string associated with a combination.
 *
 * @param array  $comb2crit   Map combination => criteria.
 * @param string $combinaison Combination to look up.
 * @return mixed The mapped value, or '' when the combination is unknown.
 */
function nouveauxCriteres($comb2crit, $combinaison)
{
    if (array_key_exists($combinaison, $comb2crit)) {
        return $comb2crit[$combinaison];
    }
    return '';
}

// --------------------------------------------------------------------------- //
// Special character filter
// --------------------------------------------------------------------------- //
/**
 * Replaces '@' by 'a' and quote/slash by a space in every non-empty form value.
 *
 * @param array $formR Form values, modified in place.
 */
function filtreCaracteresSpeciaux(&$formR)
{
    // Loop-invariant replacement tables.
    $search = array('@', '\'', '/');
    $replace = array('a', ' ', ' ');
    foreach ($formR as $label => $valeur) {
        if (empty($valeur) == true) {
            continue;
        }
        $formR[$label] = str_replace($search, $replace, $valeur);
    }
}

// --------------------------------------------------------------------------- //
// SIREN / NIC filter
// --------------------------------------------------------------------------- //
/**
 * Adds a 'siren' (first 9-digit run) or, failing that, a 'nic' (first 5-digit
 * run) filter from $formR['siret'] when the criteria contain 'I'.
 *
 * @param array  $formR    Form values.
 * @param string $criteres Active criteria letters.
 * @param object $sphinx   Sphinx client receiving the filter.
 */
function filtreSiret(&$formR, &$criteres, &$sphinx)
{
    if (empty($formR['siret']) == true) {
        return;
    }
    if (strstr($criteres, 'I') == false) {
        return;
    }
    if (preg_match('/[0-9]{9}/', $formR['siret'], $arraySiren) > 0) {
        debugln("filtre siren='$arraySiren[0]'");
        $sphinx->SetFilter('siren', $arraySiren);
    } else if (preg_match('/[0-9]{5}/', $formR['siret'], $arrayNic) > 0) {
        debugln("filtre nic='$arrayNic[0]'");
        $sphinx->SetFilter('nic', $arrayNic);
    }
}

// --------------------------------------------------------------------------- //
// Address filter
// --------------------------------------------------------------------------- //
/**
 * Splits $formR['cpVille'] into city / department / locality, adds the
 * matching Sphinx filters, and tries to complete the postal code from the
 * city name when no locality could be derived.
 *
 * Recognised inputs, in order: "NNNNN <city> CEDEX", a 5-digit postal code,
 * a department code (2A, 2B, 97x/98x or two digits); anything else is taken
 * as a city name.
 *
 * Changes compared with the previous version:
 *  - the city name is escaped before being placed in the SQL text;
 *  - a missing connection or failed query no longer causes a fatal error;
 *  - the department pattern no longer accepts a literal '|' ("2|"), and
 *    three-digit overseas departments are matched (that alternative was
 *    unreachable before);
 *  - the text actually typed (e.g. "2A") is removed from the city, not the
 *    converted numeric code;
 *  - the database connection is only opened when the completion query runs.
 *
 * @param array  $formR    Form values; 'ville', 'departement' and 'localite'
 *                         may be written.
 * @param string $criteres Active criteria letters ('L' = postal code filter,
 *                         'D' = department filter).
 * @param object $sphinx   Sphinx client receiving the filters.
 */
function filtreAdresse(&$formR, &$criteres, &$sphinx)
{
    if (empty($formR['cpVille']) == true) {
        return;
    }
    $adressePostale = $formR['cpVille'];

    if (preg_match('/^[0-9]{5}\s(.*)\sCEDEX/i', $adressePostale, $codePostaux)) {
        // CEDEX address: keep only the city name
        $formR['departement'] = '';
        $formR['ville'] = $codePostaux[1];
    } elseif (preg_match('/[0-9]{5}/', $adressePostale, $codePostaux) > 0) {
        // Postal code
        if (strstr($criteres, 'L') != false) {
            debugln("filtre adr_cp='$codePostaux[0]'");
            $sphinx->SetFilter('adr_cp', $codePostaux);
        } else if (strstr($criteres, 'D') != false) {
            $departement = substr($codePostaux[0], 0, 2);
            if ($departement == 97 || $departement == 98) {
                $departement = substr($codePostaux[0], 0, 3);
            }
            debugln("filtre adr_dep='$departement'");
            $sphinx->SetFilter('adr_dep', array($departement));
        }
        $formR['ville'] = str_replace($codePostaux[0], '', $adressePostale);
        $dep = intval(substr($codePostaux[0], 0, 2));
        if ($codePostaux[0] == '98000') {
            // Monaco
            $formR['departement'] = 99;
            $formR['localite'] = 0;
        } else if ($dep == 97 || $dep == 98) {
            // Overseas: three-digit department
            $formR['departement'] = substr($codePostaux[0], 0, 3);
            $formR['localite'] = substr($codePostaux[0], 3, 2);
        } else {
            $formR['departement'] = substr($codePostaux[0], 0, 2);
            $formR['localite'] = substr($codePostaux[0], 2, 3);
        }
    } elseif (preg_match('/(2[AB]|9[78][0-9]|[0-9]{2})/', $adressePostale, $departements)) {
        // Department code
        $saisi = $departements[1];
        $departement = $saisi;
        if ($departement == '2A') {
            $departement = 201;
        }
        if ($departement == '2B') {
            $departement = 202;
        }
        if (strstr($criteres, 'D') != false) {
            debugln("filtre adr_dep='$departement'");
            $sphinx->SetFilter('adr_dep', array($departement));
        }
        // Strip what was typed, not the converted code.
        $formR['ville'] = str_replace($saisi, '', $adressePostale);
        $formR['departement'] = $departement;
    } else {
        $formR['ville'] = $adressePostale;
    }

    // Completion of the postal code from the city name
    if (isset($formR['ville']) == true && isset($formR['localite']) == false) {
        $ville = strtoupper(trim($formR['ville']));
        if ($ville == 'PARIS') {
            $formR['departement'] = 75;
            return;
        }
        if ($ville == 'LYON') {
            $formR['departement'] = 69;
            return;
        }
        if ($ville == 'MARSEILLE') {
            $formR['departement'] = 13;
            return;
        }

        $gDatabaseJO = databaseJO();
        if (!$gDatabaseJO) {
            return;
        }
        // NOTE(review): the handle is presumably a mysqli object (num_rows /
        // fetch_assoc are used on its results); fall back to addslashes()
        // if it does not expose real_escape_string().
        if (method_exists($gDatabaseJO, 'real_escape_string')) {
            $villeSql = $gDatabaseJO->real_escape_string($ville);
        } else {
            $villeSql = addslashes($ville);
        }
        $requeteDB = "select * from communes where LibCom like '$villeSql'";
        debugln($requeteDB);
        $resDB = $gDatabaseJO->query($requeteDB);
        if ($resDB != false && $resDB->num_rows == 1) {
            $cp = $resDB->fetch_assoc();
            $cp = $cp['Code Postal'];
            $formR['departement'] = substr($cp, 0, 2);
            if ($formR['departement'] == '97' || $formR['departement'] == '98') {
                $formR['departement'] = substr($cp, 0, 3);
                $formR['localite'] = substr($cp, 3, 2);
            } else {
                $formR['localite'] = substr($cp, 2, 3);
            }
            if (DEBUG) {
                print 'Completion: '.$formR['ville'].' '.
                    $formR['departement'].$formR['localite'].'
';
            }
        }
        // TODO:
        // Could be improved by using the department when several rows match,
        // or by truncating the city name when none does
    }
}

// --------------------------------------------------------------------------- //
// Street number filter
// --------------------------------------------------------------------------- //
/**
 * Adds an 'adr_num' filter when a street number was entered and the criteria
 * contain 'N'.
 *
 * @param array  $formR    Form values.
 * @param string $criteres Active criteria letters.
 * @param object $sphinx   Sphinx client receiving the filter.
 */
function filtreNumero(&$formR, &$criteres, &$sphinx)
{
    if (empty($formR['numVoie']) == false) {
        if (strstr($criteres, 'N') != false) {
            debugln("filtre adr_num='$formR[numVoie]'");
            $sphinx->SetFilter('adr_num', array($formR['numVoie']));
        }
    }
}

// --------------------------------------------------------------------------- //
// Birth date filter
// --------------------------------------------------------------------------- //
/**
 * Adds birth day / month / year filters from the form.
 *
 * Non-digits are stripped from each part. Day is filtered with 'J', month
 * with 'M'; the year is filtered exactly with 'A', or as a +/- 5 year range
 * with 'R'. The range checks of the previous version only contained
 * commented-out messages and had no effect, so they were removed. Debug
 * labels now name the attribute that is actually filtered.
 *
 * @param array  $formR    Form values (dirDateNaissJJ / MM / AAAA).
 * @param string $criteres Active criteria letters.
 * @param object $sphinx   Sphinx client receiving the filters.
 */
function filtreDateNaiss(&$formR, &$criteres, &$sphinx)
{
    $jj = preg_replace('/[^0-9]/', '', isset($formR['dirDateNaissJJ']) ? $formR['dirDateNaissJJ'] : '');
    $mm = preg_replace('/[^0-9]/', '', isset($formR['dirDateNaissMM']) ? $formR['dirDateNaissMM'] : '');
    $aa = preg_replace('/[^0-9]/', '', isset($formR['dirDateNaissAAAA']) ? $formR['dirDateNaissAAAA'] : '');

    if (empty($jj) == false && strstr($criteres, 'J') != false) {
        debugln("filtre naiss_jour='$jj'");
        $sphinx->SetFilter('naiss_jour', array($jj));
    }
    if (empty($mm) == false && strstr($criteres, 'M') != false) {
        debugln("filtre naiss_mois='$mm'");
        $sphinx->SetFilter('naiss_mois', array($mm));
    }
    if (empty($aa) == false) {
        if (strstr($criteres, 'A') != false) {
            debugln("filtre naiss_annee='$aa'");
            $sphinx->SetFilter('naiss_annee', array($aa));
        } else if (strstr($criteres, 'R') != false) {
            debugln("filtre naiss_annee='".($aa-5).'-'.($aa+5)."'");
            $sphinx->SetFilterRange('naiss_annee', $aa - 5, $aa + 5);
        }
    }
}

// Filter on the "active" flag: applied when $formR['actif'] exists and is
// loosely equal to 0 or 1.
function filtreActif(&$formR, &$criteres, &$sphinx)
{
    if ( array_key_exists('actif', $formR) &&
in_array($formR['actif'], array(0,1)) ) {
        $sphinx->setFilter('actif', array($formR['actif']));
    }
}

/**
 * Head-office filter: restricts results to siege = 1 when the form asks for it.
 *
 * @param array  $formR    Form values.
 * @param string $criteres Active criteria letters (unused here).
 * @param object $sphinx   Sphinx client receiving the filter.
 */
function filtreSiege(&$formR, &$criteres, &$sphinx)
{
    if (!array_key_exists('siege', $formR)) {
        return;
    }
    if ($formR['siege'] != 1) {
        return;
    }
    $sphinx->setFilter('siege', array(1));
}

/**
 * Legal-form filter: restricts results on the 'cj' attribute when
 * $formR['fj'] exists and is not null.
 *
 * @param array  $formR    Form values.
 * @param string $criteres Active criteria letters (unused here).
 * @param object $sphinx   Sphinx client receiving the filter.
 */
function filtreFormeJuridique(&$formR, &$criteres, &$sphinx)
{
    if (!array_key_exists('fj', $formR) || $formR['fj'] === null) {
        return;
    }
    $codeJuridique = intval($formR['fj']);
    $sphinx->setFilter('cj', array($codeJuridique));
}

// --------------------------------------------------------------------------- //
// First Sphinx query
// --------------------------------------------------------------------------- //
// First query, without stop-word handling and with all the words of the
// company name concatenated
// --------------------------------------------------------------------------- //
/**
 * Applies every filter, builds the extended query text and runs it.
 *
 * For 'raisonSociale' the value is quoted when it holds no double quote;
 * when it contains spaces the query becomes
 * (<value without spaces> | <quoted value>~2).
 *
 * @param object $sphinx         Sphinx client.
 * @param string $index          Index name; its first three characters pick
 *                               the sort order.
 * @param array  $formR          Form values (may be changed by the filters).
 * @param string $criteres       Active criteria letters.
 * @param array  $criteresSphinx Map form field => Sphinx field operator.
 * @param array  $form2crit      Map form field => criteria letter.
 * @param bool   $sirenValide    When true, only valid SIRENs are kept.
 * @return mixed Whatever $sphinx->Query() returns.
 */
function premiereRequeteSphinx(&$sphinx, &$index, &$formR, &$criteres, &$criteresSphinx, &$form2crit, $sirenValide)
{
    filtreSiege($formR, $criteres, $sphinx);
    filtreActif($formR, $criteres, $sphinx);
    filtreFormeJuridique($formR, $criteres, $sphinx);
    filtreSiret($formR, $criteres, $sphinx);
    filtreAdresse($formR, $criteres, $sphinx);
    filtreNumero($formR, $criteres, $sphinx);
    if ($sirenValide == true) {
        $sphinx->SetFilter('sirenValide', array(1));
    }

    $requete = '';
    foreach ($formR as $champ => $saisie) {
        // Both branches of the original required a non-empty value.
        if (empty($saisie)) {
            continue;
        }
        if ($champ == 'naf') {
            $requete .= '@ape_etab '.$saisie.' ';
            continue;
        }
        if (!isset($criteresSphinx[$champ])) {
            continue;
        }
        if (strstr($criteres, $form2crit[$champ]) == false) {
            continue;
        }
        if ($champ == 'raisonSociale') {
            $compact = str_replace(' ', '', $saisie);
            $phrase = (strstr($saisie, '"') == false) ? '"'.$saisie.'"' : $saisie;
            $saisie = ($compact != $saisie)
                ? '('.$compact.' | '.$phrase.'~2)'
                : $phrase;
        }
        // " \n" is the same two bytes (space, line break) as the original literal.
        $requete .= $criteresSphinx[$champ].' '.$saisie." \n";
    }
    debugln("requete='$requete'");

    $famille = substr($index, 0, 3);
    if ($famille == 'ent') {
        $sphinx->SetSortMode(SPH_SORT_EXTENDED, 'sirenValide DESC, actif DESC, siege DESC, rang DESC');
    } elseif ($famille == 'dir') {
        $sphinx->SetSortMode(SPH_SORT_EXTENDED, 'actif DESC');
    }

    return $sphinx->Query($requete, $index);
}

// --------------------------------------------------------------------------- //
// Sphinx query
// --------------------------------------------------------------------------- //
/**
 * Applies every filter, optionally rewrites form values as quorum
 * expressions, builds the extended query text and runs it.
 *
 * When $quorum_actif is true, every field whose $quorum count is above 1 and
 * whose value holds no double quote becomes "<value>"/<count - 1>.
 *
 * @param object $sphinx         Sphinx client.
 * @param string $index          Index name.
 * @param array  $formR          Form values (modified in place).
 * @param string $criteres       Active criteria letters.
 * @param array  $criteresSphinx Map form field => Sphinx field operator.
 * @param array  $form2crit      Map form field => criteria letter.
 * @param bool   $quorum_actif   Whether quorum rewriting is enabled.
 * @param array  $quorum         Map form field => word count.
 * @param bool   $sirenValide    When true, only valid SIRENs are kept.
 * @return mixed Whatever $sphinx->Query() returns.
 */
function requeteSphinx(&$sphinx, &$index, &$formR, &$criteres, &$criteresSphinx, &$form2crit, $quorum_actif, $quorum, $sirenValide)
{
    filtreSiege($formR, $criteres, $sphinx);
    filtreActif($formR, $criteres, $sphinx);
    filtreFormeJuridique($formR, $criteres, $sphinx);
    filtreSiret ($formR, $criteres, $sphinx);
    filtreAdresse($formR, $criteres, $sphinx);
    filtreNumero ($formR, $criteres, $sphinx);
    if ($sirenValide == true) {
        $sphinx->SetFilter('sirenValide', array(1));
    }
    if ($quorum_actif == true) {
        foreach ($quorum as $label => $valeur) {
            if ($valeur > 1 && strstr($formR[$label], '"') == false) {
                $formR[$label] = '"'.$formR[$label].'"/'.($valeur-1);
            }
        }
    }
    $requete_sphinx = '';
    foreach ($formR as $label => $valeur) {
        if ($label == 'naf' && empty($valeur) == false) {
            $requete_sphinx .= '@ape_etab '.$valeur.' ';
        } else if (empty($valeur) == false && isset($criteresSphinx[$label]) == true && strstr($criteres, $form2crit[$label]) != false) {
            $requete_sphinx .= $criteresSphinx[$label].' '.$valeur.' 
';
        }
    }
    debugln("requete='$requete_sphinx'");
    if (substr($index, 0, 3) == 'ent') {
        $sphinx->SetSortMode(SPH_SORT_EXTENDED,'sirenValide DESC, rang DESC, actif DESC, siege DESC');
    } else if (substr($index, 0, 3) == 'dir') {
        $sphinx->SetSortMode(SPH_SORT_EXTENDED, 'actif DESC');
    }
    return $sphinx->Query($requete_sphinx, $index);
}

// --------------------------------------------------------------------------- //
// Starting criteria
// --------------------------------------------------------------------------- //
/**
 * Builds the initial criteria string from the filled-in form fields.
 *
 * Fields are visited in $form2crit order: a filled field contributes its
 * letter, an empty one a space. As soon as a filled field maps to 'I', the
 * function returns 'I ' immediately (only the SIREN is kept in that case).
 *
 * @param array $formR     Form values.
 * @param array $form2crit Map form field => criteria letter.
 * @return string Criteria string.
 */
function criteresDeDepart(&$formR, &$form2crit)
{
    $criteres = '';
    foreach ($form2crit as $label => $valeur) {
        if (empty($formR[$label]) == false) {
            if ($valeur == 'I') {
                // In this case only the SIREN is kept
                return 'I ';
            }
            $criteres .= $valeur;
        } else {
            $criteres .= ' ';
        }
    }
    return $criteres;
}

// --------------------------------------------------------------------------- //
// Sphinx status display
// --------------------------------------------------------------------------- //
/**
 * In DEBUG mode, prints the outcome of the last Sphinx query: the error when
 * it failed, otherwise the warning (if any), totals, timing and per-word
 * statistics. Does nothing when DEBUG is falsy.
 *
 * @param object      $sphinx    Sphinx client (for last error / warning).
 * @param array|false $resSphinx Result of $sphinx->Query().
 */
function afficheStatusSphinx(&$sphinx, &$resSphinx)
{
    if (DEBUG) {
        if ($resSphinx == false) {
            println('Query failed: '.$sphinx->GetLastError().'.');
            return;
        }
        if ($sphinx->GetLastWarning()) {
            println('WARNING: '.$sphinx->GetLastWarning());
        }
        println("Query retrieved $resSphinx[total]".
                " of $resSphinx[total_found] matches in $resSphinx[time] sec.");
        println('Query stats:');
        if (isset ($resSphinx['words']) && is_array($resSphinx['words'])) {
            foreach ($resSphinx['words'] as $word => $info) {
                println(" '$word' found $info[hits] times".
                        " in $info[docs] documents");
            }
            println('');
        }
    }
}

// --------------------------------------------------------------------------- //
// Display of the database rows
// --------------------------------------------------------------------------- //
/**
 * Debug helper: loads the rows matching the Sphinx results from $table and
 * prints, for each row, one "<letter>='<value>'" pair per $base2form entry.
 *
 * Changes compared with the previous version: only matches that actually
 * exist are read (same upper bounds as before), and a missing connection or
 * a failed query prints 'Aucun résultat' instead of causing a fatal error.
 *
 * @param array  $resSphinx Sphinx result ('matches' as a 0-based list, 'total').
 * @param array  $formR     Form values ('type' selects the ordering).
 * @param array  $form2crit Map form field => criteria letter.
 * @param string $table     Table to read.
 * @param array  $base2form Map column name => form field.
 * @param int    $deb       Offset of the first result.
 * @param int    $nbRep     Maximum number of rows.
 */
function afficheDB(&$resSphinx, &$formR, &$form2crit, $table, &$base2form, $deb, $nbRep)
{
    $gDatabaseJO = databaseJO();
    if (isset($resSphinx['matches']) == false) {
        println('Aucun résultat');
        return;
    }

    // The first match is always taken; the following ones are bounded by
    // the total and by $nbRep, and must exist.
    $ids = array();
    for ($i = 0; isset($resSphinx['matches'][$i]); ++$i) {
        if ($i > 0 && ($i + $deb >= $resSphinx['total'] || $i >= $nbRep)) {
            break;
        }
        $ids[] = $resSphinx['matches'][$i]['id'];
    }
    if (count($ids) == 0 || !$gDatabaseJO) {
        println('Aucun résultat');
        return;
    }

    $estEntreprise = ($formR['type'] == 'ent');
    if ($estEntreprise) {
        $requeteDB = "select *, (siren>200) AS sirenValide";
    } else {
        $requeteDB = "select *";
    }
    $requeteDB .= " from $table where id=".implode(' or id=', $ids);
    if ($estEntreprise) {
        $requeteDB .= ' ORDER BY sirenValide DESC, actif DESC, siege DESC, rang DESC';
    } else {
        $requeteDB .= ' ORDER BY actif DESC';
    }
    $requeteDB .= ' limit 0, '.$nbRep;
    debugln("requeteDB='$requeteDB'");

    $resDB = $gDatabaseJO->query($requeteDB);
    if ($resDB == false) {
        println('Aucun résultat');
        return;
    }
    $nb_res = $resDB->num_rows;
    for ($i = 0; $i < $nb_res; ++$i) {
        $ligne = $resDB->fetch_assoc();
        println();
        foreach ($base2form as $label => $valeur) {
            // NOTE(review): both branches print the same text in this copy of
            // the file - presumably markup highlighting the filled-in fields
            // was lost; confirm against the original.
            if (empty($formR[$valeur]) == false) {
                print "$form2crit[$valeur]='$ligne[$label]' ";
            } else {
                print "$form2crit[$valeur]='$ligne[$label]' ";
            }
        }
    }
    println();
}

// --------------------------------------------------------------------------- //
// Number of words found in a field
// --------------------------------------------------------------------------- //
/**
 * Counts the words of $champ that appear in the Sphinx word statistics.
 *
 * Non-letters are replaced by spaces and the text is lower-cased before
 * being split on spaces. $n counts the words present in $res['words'], $nul
 * those among them with zero hits; the result is $n - $nul + 1 when more
 * than two words have zero hits, $n otherwise.
 *
 * @param array  $res   Sphinx result (uses 'words').
 * @param string $champ Field text.
 * @return int Word count as described above; 0 when there are no statistics.
 */
function nombreDeMots(&$res, $champ)
{
    if (isset($res['words']) == false) {
        return 0;
    }
    $champ = preg_replace('/[^A-Za-z]/', ' ', $champ);
    $mot = explode(' ', strtolower($champ));
    $n = 0;
    $nul = 0;
    foreach ($mot as $m) {
        if (isset($res['words'][$m]) == true) {
            debugln('nombre de mots: '. $m.' 
=> '.$res['words'][$m]['hits']);
            if ($res['words'][$m]['hits'] == 0) {
                ++$nul;
            }
            ++$n;
        }
    }
    if ($nul > 2) {
        return $n - $nul + 1;
    } else {
        return $n;
    }
}

// --------------------------------------------------------------------------- //
// changePass
// --------------------------------------------------------------------------- //
// mode and index must be set every time
// --------------------------------------------------------------------------- //
/**
 * Moves the search to the next pass and sets the matching mode / index.
 *
 *  - pass 1 -> 2: phonetic index ('ent_phx');
 *  - pass 2 -> 3: 'ent_mns' ('ent' when SPHINX_ENT_VERSION == 2);
 *  - pass 3 -> 4: same index, quorum enabled (n-1);
 *  - pass 4 -> 5: every quorum expression "<phrase>"/N with N > 1 is
 *    lowered to N-1 (n-2 overall).
 *
 * Fix: in pass 5 only the quorum count after the closing quote is rewritten.
 * The previous str_replace() changed every occurrence of that digit,
 * including inside the quoted phrase ('"3 suisses"/3' became
 * '"2 suisses"/2'), and counts containing a 0 (e.g. 10) were mis-parsed.
 *
 * @param int    $pass        Current pass; updated.
 * @param mixed  $mode        Sphinx match mode; updated for passes 2 to 4.
 * @param string $index       Sphinx index; updated for passes 2 to 4.
 * @param bool   $quorumActif Set to true when entering pass 4.
 * @param array  $formR       Form values; quorum expressions are updated
 *                            when entering pass 5.
 * @return bool True when a next pass exists, false otherwise.
 */
function changePass(&$pass, &$mode, &$index, &$quorumActif, &$formR)
{
    switch ($pass) {
        case 1:
            // Pass 2: Phonex
            $pass = 2;
            $mode = SPH_MATCH_EXTENDED;
            $index = 'ent_phx';
            return true;
        case 2:
            // Pass 3: Ispell
            $pass = 3;
            $mode = SPH_MATCH_EXTENDED;
            $index = 'ent_mns';
            if (SPHINX_ENT_VERSION == 2) {
                $index = 'ent';
            }
            return true;
        case 3:
            // Pass 4: quorum n-1
            $pass = 4;
            $mode = SPH_MATCH_EXTENDED;
            $index = 'ent_mns';
            if (SPHINX_ENT_VERSION == 2) {
                $index = 'ent';
            }
            $quorumActif = true;
            return true;
        case 4:
            // Pass 5: quorum n-2
            $pass = 5;
            foreach ($formR as $label => $valeur) {
                // Greedy prefix: the last '"/<digits>' of the value is the quorum.
                if (preg_match('@^(.*"/)([0-9]+)(.*)$@s', $valeur, $parts) === 1) {
                    $n = intval($parts[2]);
                    if ($n > 1) {
                        $formR[$label] = $parts[1].($n - 1).$parts[3];
                    }
                }
            }
            return true;
        default:
            return false;
    }
}

// --------------------------------------------------------------------------- //
// initSphinx
// --------------------------------------------------------------------------- //
/**
 * Prepares the client for a pass: logs the pass number, sets the match mode,
 * clears the filters and sets the result window.
 *
 * @param object $sphinx Sphinx client.
 * @param mixed  $mode   Match mode passed to SetMatchMode().
 * @param int    $pass   Pass number (logged only).
 * @param int    $deb    Offset of the first result.
 * @param int    $nbRep  Number of results to return.
 * @param int    $max    Maximum number of matches.
 */
function initSphinx(&$sphinx, $mode, $pass, $deb, $nbRep, $max)
{
    debugln();
    debugln('pass '.$pass);
    debugln();
    $sphinx->SetMatchMode($mode);
    $sphinx->resetFilters();
    $sphinx->SetLimits(intval($deb), intval($nbRep), intval($max));
}

// --------------------------------------------------------------------------- //
// Criteria for the search by company officer
// --------------------------------------------------------------------------- //
/**
 * Returns the next criteria string to try for an officer search.
 *
 * A string without a trailing 'p' is retried on the phonetic index: $index
 * becomes 'dir_phx' and the same string with 'p' appended is returned. A
 * string ending in 'p' has that suffix removed, $index becomes 'dir' and the
 * successor is read from the table ('' when there is none).
 *
 * NOTE(review): the table keys look like fixed-width strings whose padding
 * may have been collapsed in this copy of the file; confirm.
 *
 * @param string $c     Current criteria string.
 * @param string $index Sphinx index; always overwritten.
 * @return string Next criteria string, or '' when the list is exhausted.
 */
function criteresDir($c, &$index)
{
    if (substr($c, strlen($c) - 1, 1) == 'p') {
        $c = substr($c, 0, strlen($c) - 1);
        $index = 'dir';
    } else {
        $index = 'dir_phx';
        return $c.'p';
    }
    $tab = array('NPAMJDV' => 'NPAM DV',
                 'NPAM DV' => 'NPA DV',
                 'NPA DV' => 'NPR DV',
                 'NPR DV' => 'NP DV',
                 'NP DV' => 'NPAMJD ',
                 'NPAMJD ' => 'NPAMJ ',
                 'NPAMJ ' => 'N AMJDV',
                 'N AMJDV' => 'N AM DV',
                 'N AM DV' => 'N A DV',
                 'N A DV' => 'N R DV',
                 'N R DV' => 'N DV',
                 'N DV' => 'N AMJD ',
                 'N AMJD ' => 'N AMJ ',
                 'N AMJ ' => ' PAMJDV',
                 ' PAMJDV' => ' PAM DV',
                 ' PAM DV' => ' PA DV',
                 ' PA DV' => ' PR DV',
                 ' PR DV' => ' P DV',
                 ' P DV' => ' PAMJD ',
                 ' PAMJD ' => ' PAMJ ',
                 ' PAMJ ' => ' PAM ');
    if (isset($tab[$c]) == true) {
        $ret = $tab[$c];
    } else {
        $ret = '';
    }
    return $ret;
}

// --------------------------------------------------------------------------- //
// clientSphinx
// --------------------------------------------------------------------------- //
/**
 * Trims the form values and creates the Sphinx client for $formR['type'].
 *
 * Host, port and API version come from the SPHINX_<TYPE>_* constants; the
 * version defaults to 1 when its constant is not defined.
 *
 * Fix: a missing or unknown type now returns false. It used to fall through
 * with $host, $port and $version undefined.
 *
 * @param array $formR Form values; non-empty values are trimmed in place.
 * @return object|false The configured client, or false when the form is
 *                      empty or the type is not one of ent/dir/histo/act.
 */
function clientSphinx(&$formR)
{
    // Form
    $formulaire_vide = true;
    foreach ($formR as $label => $valeur) {
        if ($label != 'type' && // This field should not be in formR
            empty($valeur) == false) {
            $formulaire_vide = false;
            $formR[$label] = trim($valeur);
        }
    }
    if ($formulaire_vide == true) {
        return false;
    }
    if (DEBUG) {
        foreach ($formR as $label => $valeur) {
            println("$label = '$valeur'");
        }
    }
    switch (isset($formR['type']) ? $formR['type'] : null) {
        case 'ent':
            $host = SPHINX_ENT_HOST;
            $port = SPHINX_ENT_PORT;
            $version = defined('SPHINX_ENT_VERSION') ? SPHINX_ENT_VERSION : 1;
            break;
        case 'dir':
            $version = defined('SPHINX_DIR_VERSION') ? SPHINX_DIR_VERSION : 1;
            $host = SPHINX_DIR_HOST;
            $port = SPHINX_DIR_PORT;
            break;
        case 'histo':
            $version = defined('SPHINX_HISTO_VERSION') ? SPHINX_HISTO_VERSION : 1;
            $host = SPHINX_HISTO_HOST;
            $port = SPHINX_HISTO_PORT;
            break;
        case 'act':
            $version = defined('SPHINX_ACT_VERSION') ? SPHINX_ACT_VERSION : 1;
            $host = SPHINX_ACT_HOST;
            $port = SPHINX_ACT_PORT;
            break;
        default:
            // No server is configured for this type.
            return false;
    }
    switch ( $version ) {
        case 1:
            require_once 'SphinxSearch/sphinxapi-0.9.9.php';
            break;
        case 2:
            require_once 'SphinxSearch/sphinxapi-2.2.9.php';
            break;
    }
    // Sphinx client
    $sphinx = new SphinxClient();
    $sphinx->SetServer($host, $port);
    $sphinx->SetConnectTimeout(1);
    $sphinx->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
    $sphinx->SetArrayResult(true);
    return $sphinx;
}

// --------------------------------------------------------------------------- //
// compare
// --------------------------------------------------------------------------- //
/**
 * Similarity of two strings as 1 - (edit distance / longest length).
 *
 * Both strings are upper-cased and '&' is replaced by 'ET'. The Levenshtein
 * distance is computed on the strings as given and again after sorting
 * their space-separated words; the smaller distance is used.
 *
 * Fix: two empty strings are reported as identical (1) instead of dividing
 * by zero.
 *
 * @param string $a1 First string.
 * @param string $a2 Second string.
 * @return int|float Similarity; 1 means identical.
 */
function compare($a1, $a2)
{
    $a1 = strtoupper($a1);
    $a2 = strtoupper($a2);
    $a1 = str_replace('&', 'ET', $a1);
    $a2 = str_replace('&', 'ET', $a2);
    if (DEBUG) {
        print 'Compare: '.$a1.' avec: '.$a2;
    }
    $l1 = levenshtein($a1, $a2);
    $t1 = explode(' ', $a1);
    $t2 = explode(' ', $a2);
    sort($t1);
    sort($t2);
    $a1 = implode(' ', $t1);
    $a2 = implode(' ', $t2);
    $l2 = levenshtein($a1, $a2);
    $l = min($l1, $l2);
    $longueur = max(strlen($a1), strlen($a2));
    $ret = ($longueur > 0) ? 1 - $l / $longueur : 1;
    debugln(' levenshtein: '.$l.' 
pertinence: '.$ret);
    return $ret;
}

// --------------------------------------------------------------------------- //
// reponse
// --------------------------------------------------------------------------- //
/**
 * Builds the response structure returned to the caller of a search.
 *
 * The result holds 'criteres' (upper-cased values of the fields whose letter
 * is in $criteres), 'nbReponsesTotal', 'duree', one 'reponses' entry per
 * database row, 'pass' (for type 'ent') and 'nbReponses'.
 *
 * For type 'ent' a general relevance is computed as 100 times the weight of
 * the criteria actually used over the weight of all filled-in fields, then
 * multiplied per row by the similarity of the company name, street and city.
 *
 * Fixes: no division by zero when no weighted field is filled in (the
 * general relevance is then 0), and 'nbReponses' is 0 instead of calling
 * count() on an undefined entry when there are no rows.
 *
 * @param array       $resSphinx Sphinx result ('total', and 'pass' for 'ent').
 * @param object|null $resDB     Database result set (data_seek / num_rows /
 *                               fetch_assoc); ignored when not an object.
 * @param string      $criteres  Criteria letters that produced the result.
 * @param mixed       $time      Duration reported as 'duree'.
 * @param array       $formR     Form values ('type' is required).
 * @param array       $form2crit Map form field => criteria letter.
 * @param int         $deb       Offset of the first result (unused here).
 * @param array       $ligneDir  Officer rows, indexed like the DB rows
 *                               (used for type 'dir').
 * @return array Response structure described above.
 */
function reponse(&$resSphinx, &$resDB, $criteres, $time, $formR, $form2crit, $deb, $ligneDir = array())
{
    $criteresRet = array();
    foreach ($form2crit as $field => $letter) {
        if (preg_match("/$letter/", $criteres)) {
            if (empty($formR[$field]) == false) {
                $criteresRet[] = strtoupper($formR[$field]);
            }
        }
    }
    $ret = array();
    $ret['criteres'] = $criteresRet;
    $ret['nbReponsesTotal'] = $resSphinx['total'];
    $ret['duree'] = $time;

    $pertinence_generale = 100;
    if ($formR['type'] == 'ent') {
        $tot = 0;
        $num = 0;
        $poids = array(
            'I' => 10,
            'T' => 1,
            'S' => 9,
            'E' => 8,
            'P' => 7,
            'D' => 6,
            'L' => 4,
            'V' => 5,
            'N' => 2,
            'R' => 3,
        );
        foreach ($form2crit as $field => $letter) {
            if (empty($formR[$field]) == false) {
                $tot += $poids[$letter];
                if (preg_match("/$letter/", $criteres)) {
                    $num += $poids[$letter];
                }
            }
        }
        // Nothing filled in: the ratio is undefined, report 0.
        if ($tot > 0) {
            $pertinence_generale = intval($pertinence_generale * $num / $tot);
        } else {
            $pertinence_generale = 0;
        }
    }

    if ( is_object($resDB) ) {
        $resDB->data_seek(0);
        for ($i = 0; $i < $resDB->num_rows; $i++) {
            $ligne = $resDB->fetch_assoc();
            $ret['reponses'][$i]['id'] = $ligne['id'];

            $pertinence = $pertinence_generale;
            if ($formR['type'] == 'ent') {
                if (empty($formR['raisonSociale']) == false) {
                    $pertinence *= compare($formR['raisonSociale'], $ligne['raisonSociale']);
                }
                if (empty($formR['voie']) == false) {
                    $pertinence *= compare($formR['voie'], $ligne['adr_typeVoie'].' '.$ligne['adr_libVoie']);
                }
                if (empty($formR['ville']) == false) {
                    $pertinence *= compare($formR['ville'], $ligne['adr_ville']);
                }
            }
            $ret['reponses'][$i]['Pertinence'] = $pertinence;
            $ret['reponses'][$i]['Source'] = $ligne['source'];
            $ret['reponses'][$i]['SourceId'] = $ligne['source_id'];
            $ret['reponses'][$i]['Siret'] = $ligne['siret'];
            $ret['reponses'][$i]['Siren'] = $ligne['siren'];
            $ret['reponses'][$i]['Nic'] = $ligne['nic'];
            $ret['reponses'][$i]['Siege'] = $ligne['siege'];
            $ret['reponses'][$i]['Nom'] = $ligne['raisonSociale'];
            $ret['reponses'][$i]['Nom2'] = '';
            $ret['reponses'][$i]['Sigle'] = $ligne['sigle'];
            $ret['reponses'][$i]['Enseigne'] = $ligne['enseigne'];

            $adresse = '';
            if ( intval($ligne['adr_dep'])==99 && intval($ligne['adr_num'])==0) {
                // Department 99 without a street number: street type and name only
                $adresse.= $ligne['adr_typeVoie'].' '.$ligne['adr_libVoie'];
            } else {
                if ( !empty($ligne['adr_num']) ) {
                    $adresse.= $ligne['adr_num'].' ';
                }
                if ( !empty($ligne['adr_btq']) ) {
                    $adresse.= $ligne['adr_btq'].' ';
                }
                if ( !empty($ligne['adr_typeVoie']) ) {
                    $adresse.= $ligne['adr_typeVoie'].' ';
                }
                if ( !empty($ligne['adr_libVoie']) ) {
                    $adresse.= $ligne['adr_libVoie'].' ';
                }
                $adresse = trim($adresse);
            }
            $ret['reponses'][$i]['Adresse'] = $adresse;
            $ret['reponses'][$i]['Adresse2'] = $ligne['adr_comp'];
            $ret['reponses'][$i]['CP'] = $ligne['adr_cp'];
            $ret['reponses'][$i]['Ville'] = $ligne['adr_ville'];
            $ret['reponses'][$i]['Pays'] = empty($ligne['pays']) ?
                'France' : $ligne['pays'] ;
            $ret['reponses'][$i]['Tel'] = $ligne['tel'];
            $ret['reponses'][$i]['Fax'] = $ligne['fax'];
            $ret['reponses'][$i]['FJ'] = $ligne['cj'];
            $ret['reponses'][$i]['Actif'] = $ligne['actif'];
            $ret['reponses'][$i]['NafEtab'] = $ligne['ape_etab'];
            $ret['reponses'][$i]['NafEnt'] = $ligne['ape_entrep'];

            if ($formR['type']=='dir') {
                // Company officer
                $ret['reponses'][$i]['DirRs'] = '';
                $ret['reponses'][$i]['DirNom'] = $ligneDir[$i]['nom'];
                $ret['reponses'][$i]['DirPrenom'] = $ligneDir[$i]['prenom'];
                $ret['reponses'][$i]['DirNomUsage'] = $ligneDir[$i]['naissance_nom'];
                $ret['reponses'][$i]['DirDateNaiss'] = $ligneDir[$i]['naissance_date'];
                $ret['reponses'][$i]['DirLieuNaiss'] = $ligneDir[$i]['naissance_lieu'];
                $ret['reponses'][$i]['DirDateEffet'] = '';
                $ret['reponses'][$i]['DirFonction'] = $ligneDir[$i]['fonction_lib'];
                $ret['reponses'][$i]['DirDepart'] = '';
            } elseif ($formR['type']=='act') {
                // Shareholder
                $ret['reponses'][$i]['ActNomRs'] = $ligne['ActRaisonSociale'];
                $ret['reponses'][$i]['ActPays'] = $ligne['ActPays'];
                $ret['reponses'][$i]['ActDateLien'] = $ligne['dateLien'];
                $ret['reponses'][$i]['ActActif'] = $ligne['ActActif'];
                $ret['reponses'][$i]['ActPmin'] = $ligne['ActPmin'];
            }
        }
    }

    if ($formR['type'] == 'ent') {
        $ret['pass'] = $resSphinx['pass'];
    }
    // 'reponses' only exists when at least one row was read.
    $ret['nbReponses'] = isset($ret['reponses']) ? count($ret['reponses']) : 0;
    if (DEBUG) {
        print '
';
        print_r($ret);
        print '
';
    }
    return $ret;
}

// --------------------------------------------------------------------------- //
// Search by company officer
// --------------------------------------------------------------------------- //
// NOTE(review): this function continues beyond the reviewed span; the code
// below is unchanged.
function rechercheDir(&$formR, $deb, $nbRep, $max)
{
    $gDatabaseJO = databaseJO();
    // Total duration
    $total_time = 0;
    $sphinx = clientSphinx($formR);
    if ($sphinx == false) {
        return array('nbReponses' => 0,
                     'nbReponsesTotal' => 0,
                     'duree' => $total_time,
                     'erreur' => 'Formulaire vide');
    }
    $criteresSphinx = array('nom' => '@nom',
                            'prenom' => '@prenom',
                            'ville' => '@naissance_lieu');
    $form2crit = array('nom' => 'N',
                       'prenom' => 'P',
                       'dirDateNaissAAAA' => 'A',
                       'dirDateNaissMM' => 'M',
                       'dirDateNaissJJ' => 'J',
                       'departement' => 'D',
                       'ville' => 'V');
    $index = 'dir';
    $mode = SPH_MATCH_EXTENDED2;
    $pass = 0;
    $criteres = 'NPAMJDV';
    initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max);
    while (empty($criteres) == false) {
        debugln("criteres: $criteres");
        filtreDateNaiss($formR, $criteres, $sphinx);
        filtreAdresse($formR, $criteres, $sphinx);
        $requete_sphinx = '';
        foreach ($formR as $label => $valeur) {
            if (empty($valeur) == false && isset($criteresSphinx[$label]) == true && strstr($criteres, $form2crit[$label]) != false) {
                if ($label == 'prenom') {
                    $requete_sphinx .= $criteresSphinx[$label].
                        ' "'.$valeur.'"/1 ';
                } else {
                    $requete_sphinx .= $criteresSphinx[$label].' '.$valeur.' 
'; } } } debugln("requete='$requete_sphinx'"); $sphinx->SetSortMode(SPH_SORT_EXTENDED, 'actif DESC'); $resSphinx = $sphinx->Query($requete_sphinx, $index); if ($resSphinx != false) { $total_time += $resSphinx['time']; } if ($resSphinx != false && $resSphinx['total'] > 0) { break; } $criteres = criteresDir($criteres, $index); $sphinx->resetFilters(); } afficheStatusSphinx($sphinx, $resSphinx); if ($resSphinx == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'erreur' => $sphinx->GetLastError(), 'criteres' => $criteres); } if ($resSphinx['total'] == 0) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'criteres' => $criteres); } if (DEBUG) { $base2form = array('adr_dep' => 'departement', 'nom' => 'nom', 'prenom' => 'prenom', 'naissance_nom' => 'nom', 'naissance_date' => 'dirDateNaissAAAA', 'naissance_lieu' => 'ville'); afficheDB($resSphinx, $formR, $form2crit, 'dirigeants', $base2form, $deb, $nbRep); } // Recherche des sieges if ($gDatabaseJO == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => $resSphinx['total'], 'duree' => $total_time, 'erreur' => 'Base inaccessible'); } if (isset($resSphinx['matches']) == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => $resSphinx['total'], 'duree' => $total_time, 'erreur' => 'Aucun résultat'); } /* file_put_contents('test.log', print_r($formR,1)); file_put_contents('test.log', $sphinx->GetLastError()."\n", FILE_APPEND); file_put_contents('test.log', 'TEST='.print_r($resSphinx,1), FILE_APPEND); */ $requeteDB = "SELECT d.nom, d.prenom, d.naissance_nom, d.naissance_date, d.naissance_lieu, l.libelle AS fonction_lib, e.id, CONCAT(LPAD(e.siren,9,0),LPAD(e.nic,5,0)) AS siret, e.source, e.source_id, LPAD(e.siren,9,0) AS siren, LPAD(e.nic,5,0) AS nic, e.siege, e.raisonSociale, e.sigle, e.enseigne, e.adr_num, e.adr_btq, e.adr_typeVoie, e.adr_libVoie, e.adr_comp, LPAD(e.adr_cp,5,0) AS adr_cp, e.adr_ville, libPays AS pays, e.adr_dep, e.adr_com, 
LPAD(e.tel,10,0) AS tel, LPAD(e.fax,10,0) AS fax, e.cj, e.actif, e.ape_etab, e.ape_entrep FROM jo.dirigeants d, jo.etablissements e LEFT OUTER JOIN jo.tabPays ON codePaysInsee = IF(adr_dep=99,adr_com,null), jo.bodacc_fonctions l WHERE d.fonction_code=l.codeFct AND d.id IN ("; $i = 0; foreach ($resSphinx['matches'] as $id => $element) { if($i > 0) $requeteDB.= ','; $requeteDB.= $element['id']; $i++; } $requeteDB .= ") AND e.id = ("; $requeteDB .= "SELECT tmp.id FROM jo.etablissements tmp "; $requeteDB .= "WHERE tmp.siren=d.siren ORDER by tmp.actif DESC, tmp.siege DESC LIMIT 1"; $requeteDB .= ") ORDER BY e.actif DESC, e.siege DESC, e.rang DESC"; //file_put_contents('test.log', $requeteDB); debugln(); debugln("requeteDB='$requeteDB'"); $resDB = $gDatabaseJO->query($requeteDB); if (!$resDB) { file_put_contents(LOG_PATH . '/mysql.log', $gDatabaseJO->error, FILE_APPEND); } // Reponse $ligneDir = array(); for ($i = 0; $i < $resDB->num_rows; $i++) { $ligne = $resDB->fetch_assoc(); $nom = $ligne['nom']; if ( $ligne['naissance_nom']!='' ) { $nom.= " née ".$ligne['naissance_nom']; } $ligneDir[$i] = array( 'id' => $ligne['id'], 'nom' => $nom, 'prenom' => $ligne['prenom'], 'fonction_lib' => $ligne['fonction_lib'], 'naissance_nom' => $ligne['naissance_nom'], 'naissance_date' => $ligne['naissance_date'], 'naissance_lieu' => $ligne['naissance_lieu'] ); } debugln(); debugln("requeteDB='$requeteDB'"); return reponse($resSphinx, $resDB, $criteres, $total_time, $formR, $form2crit, $deb, $ligneDir); } // --------------------------------------------------------------------------- // // Recherche Histo // --------------------------------------------------------------------------- // function rechercheHisto($formR, $deb, $nbRep, $max) { $gDatabaseJO = databaseJO(); $sphinx = clientSphinx($formR); $index = 'histo'; $mode = 'SPH_MATCH_EXTENDED'; $pass = 0; initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max); if (!empty($formR['annee1'])) $sphinx->SetFilter('annee1', 
array(0=>$formR['annee1'])); $sphinx->SetRankingMode ( SPH_RANK_PROXIMITY_BM25 ); $sphinxreturn = $sphinx->Query($formR['recherche'], $index); $gDatabaseJO->select_db('histobodacc'); foreach ( $sphinxreturn['matches'] as $doc => $docinfo ) { $requette = "SELECT Histo as Loc, id, nomFichier, annee1, bod, texte FROM bodacc_cor WHERE id=$doc"; $req = $gDatabaseJO->query($requette); $ligne = $req->fetch_assoc(); $etab = $ligne[0]; $tabRet[] = array( 'Localisation' => $etab['Loc'], 'id' => $doc, 'Pertinence' => $docinfo['weight'], 'Fichier' => $etab['nomFichier'], 'Annee' => $etab['annee1'], 'Code' => $etab['bod'], 'Texte' => $etab['texte'], ); } return array( 'results' => $tabRet, 'nbRet' => $sphinxreturn['total'], 'nbTot' => $sphinxreturn['total_found'], 'duration' => $sphinxreturn['time'], 'words' => $sphinxreturn['words'], ); } // --------------------------------------------------------------------------- // // Recherche par actionnaire // --------------------------------------------------------------------------- // function constructRequete($formR, $sphinxCriteres) { foreach($sphinxCriteres as $name => $critere) { if ($name == 'Req') { $requete .= $formR[$critere]; } if ($name[0] == '@') { if(!empty($formR[$critere])) $parametres .= ' '.$name.' 
'.$formR[$critere]; } } echo $sphinxRequete = '"'.$requete.'" '.$parametres; return ($sphinxRequete); } function rechercheAct($formR, $deb, $nbRep, $max) { $gDatabaseJO = databaseJO(); $sphinx = clientSphinx($formR); $sphinx->SetSortMode(SPH_SORT_EXTENDED, 'actif DESC'); $index = 'act'; $mode = 'SPH_MATCH_EXTENDED2'; $pass = 0; initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max); $Criteres = array( 'Siren2' => 'siren', 'Req' => 'actNomRS', '@Pays' => 'pays', //'PDetention' => 'pctMax', ); $form2crit = array( 'actNomRS' => 'N', 'pays' => 'P', 'pctMax' => 'M' ); $Requete = constructRequete($formR, $Criteres); if(!empty($formR['pctMin'])) $sphinx->SetFilterFloatRange('PDetention', $formR['pctMin'], 99); if(!empty($formR['pctMax'])) $sphinx->SetFilterFloatRange('PDetention', $formR['pctMin'], 99); if(!empty($formR['pctMin']) && !empty($formR['pctMax'])) $sphinx->SetFilterFloatRange('PDetention', $formR['pctMin'], $formR['pctMax']); $sphinxreturn = $sphinx->Query($Requete, $index); /* file_put_contents('test.log', print_r($formR,1)); file_put_contents('test.log', $sphinx->GetLastError()."\n", FILE_APPEND); file_put_contents('test.log', 'TEST='.print_r($sphinxreturn,1), FILE_APPEND); */ $criteres = 'NPM'; $requette = " (SELECT /*Liens*/ l.PDetention AS ActPmin, l.MajMin, l.dateEffetLien AS dateLien, IF(l.dateUpdate>l.dateInsert,l.dateUpdate,l.dateInsert) AS date, /*Participation*/ CONCAT(LPAD(e.siren,9,0), LPAD(e.nic,5,0)) AS siret, LPAD(par.siren,9,0) AS siren, LPAD(e.nic,5,0) AS nic, e.siege, par.RS AS raisonSociale, /*sigle*/ /*enseigne*/ par.actif, par.PpPm, par.adresse_num AS adr_num, par.adresse_codvoie AS adr_typeVoie, par.adresse_libvoie AS adr_libVoie, par.adresse_comp AS adr_comp, LPAD(par.adresse_cp,5,0) AS adr_cp, par.adresse_ville AS adr_ville, p1.libPays AS pays, LPAD(par.tel,10,0) AS tel, LPAD(par.fax,10,0) AS fax, /*Actionnaire*/ act.id AS ActId, act.actif AS ActActif, act.RS AS ActRaisonSociale, p2.libPays AS ActPays FROM liens2 l, liensRef par, 
liensRef act, tabPays p1, tabPays p2, etablissements e WHERE par.id = l.idPar AND act.id = l.idAct AND p1.codPays3 = par.adresse_pays AND p2.codPays3 = act.adresse_pays AND e.siren = par.siren AND par.siren >1000 AND l.id IN ( "; $i = 0; foreach ($sphinxreturn['matches'] as $id => $element) { if($i > 0) $requette.= ','; $requette.= $element['id']; $i++; } $requette.= " ) ) UNION (SELECT /*Liens*/ l.PDetention AS ActPmin, l.MajMin, l.dateEffetLien AS dateLien, IF(l.dateUpdate>l.dateInsert,l.dateUpdate,l.dateInsert) AS date, /*Participation*/ CONCAT(LPAD(e.siren,9,0), LPAD(e.nic,5,0)) AS siret, LPAD(par.siren,9,0) AS siren, LPAD(e.nic,5,0) AS nic, e.siege, par.RS AS raisonSociale, /*sigle*/ /*enseigne*/ par.actif, par.PpPm, par.adresse_num AS adr_num, par.adresse_codvoie AS adr_typeVoie, par.adresse_libvoie AS adr_libVoie, par.adresse_comp AS adr_comp, LPAD(par.adresse_cp,0,5) AS adr_cp, par.adresse_ville AS adr_ville, p1.libPays AS pays, LPAD(par.tel,10,0) AS tel, LPAD(par.fax,10,0) AS fax, /*Actionnaire*/ act.id AS ActId, act.actif AS ActActif, act.RS AS ActRaisonSociale, p2.libPays AS ActPays FROM liens2 l, liensRef par, liensRef act, tabPays p1, tabPays p2, etablissements e WHERE par.id = l.idPar AND act.id = l.idAct AND p1.codPays3 = par.adresse_pays AND p2.codPays3 = act.adresse_pays AND e.source =6 AND e.source_id = l.idPar AND l.id IN ( "; $i = 0; foreach ($sphinxreturn['matches'] as $id => $element) { if($i > 0) $requette.= ','; $requette.= $element['id']; $i++; } $requette.= " ) ) ORDER BY actif DESC, siege DESC, nic DESC"; $req = $gDatabaseJO->query($requette); return reponse($sphinxreturn, $req, $criteres, $sphinxreturn['time'], $formR, $form2crit, $deb, array()); } // --------------------------------------------------------------------------- // // Recherche entreprise // --------------------------------------------------------------------------- // function rechercheEnt(&$formR, $deb, $nbRep, $max, $sirenValide = false) { $gDatabaseJO = databaseJO(); // 
Duree totale $total_time = 0; $sphinx = clientSphinx($formR); if ($sphinx == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'erreur' => 'Formulaire vide'); } $criteresSphinx = array( //'siret' => '@siren', 'raisonSociale' => '@nom', //'numVoie' => '@adr_num', //'voie' => '@(adr_typeVoie,adresse)', 'voie' => '@adresse', //'cpVille' => '@(adr_dep,adr_cp,ville)', 'ville' => '@ville', 'telFax' => '@(tel,fax)', 'naf' => '@ape_etab', //'fj' => '@cj', ); $form2crit = array( 'siret' => 'I', 'telFax' => 'T', 'raisonSociale' => 'S', 'enseigne' => 'E', 'prenom' => 'P', 'departement' => 'D', 'localite' => 'L', 'ville' => 'V', 'numVoie' => 'N', 'voie' => 'R' ); filtreCaracteresSpeciaux($formR); // Quorum $quorum_actif = false; $quorum = array(); // Premiere requete sans la gestion des mots non significatifs // et avec concatenation de tous les mots de la raison sociale $index = 'ent'; $mode = SPH_MATCH_EXTENDED2; $pass = 0; $criteres = 'ITSEPDLVNR'; initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max); $resSphinx = premiereRequeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, $sirenValide); afficheStatusSphinx($sphinx, $resSphinx); if ($resSphinx == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'erreur' => $sphinx->GetLastError(), 'pass' => $pass, 'criteres' => $criteres); } $total_time += $resSphinx['time']; if ($resSphinx['total'] == 0) { debugln('Sans la gestion des mots non significatifs'); debugln(); $resSphinx = requeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, false, $quorum, $sirenValide); afficheStatusSphinx($sphinx, $resSphinx); if ($resSphinx == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'erreur' => $sphinx->GetLastError(), 'pass' => $pass, 'criteres' => $criteres); } $total_time += $resSphinx['time']; } if ($resSphinx['total'] == 0 && isset($formR['departement']) == true) { 
debugln('Sans la gestion des mots non significatifs et sans la localité'); debugln(); $criteres = 'ITSEPD VNR'; $sphinx->resetFilters(); $resSphinx = requeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, false, $quorum, $sirenValide); afficheStatusSphinx($sphinx, $resSphinx); if ($resSphinx == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'erreur' => $sphinx->GetLastError(), 'pass' => $pass, 'criteres' => $criteres); } $total_time += $resSphinx['time']; $criteres = 'ITSEPDLVNR'; } $total_premiere_requete = $resSphinx['total']; if ($total_premiere_requete == 0 || $total_premiere_requete > 500) { // "huit a huit" donne 414 $index = 'ent_mns'; if (SPHINX_ENT_VERSION == 2) { $index = 'ent'; } // Requete sans les mots non significatifs // pour connaitre le nombre de mots trouves pour chaque champ alpha debugln('Avec la gestion des mots non significatifs et avec quorum si l\'adresse est complete'); $raisonSociale = $formR['raisonSociale']; if ((empty($formR['ville']) == false || empty($formR['departement']) == false) && empty($formR['numVoie']) == false && empty($formR['voie']) == false) { $quorum = array('raisonSociale' => 2); $quorum_actif = true; } $resSphinx = requeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, $quorum_actif, $quorum, $sirenValide); afficheStatusSphinx($sphinx, $resSphinx); if ($resSphinx == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'erreur' => $sphinx->GetLastError(), 'pass' => $pass, 'criteres' => $criteres); } $total_time += $resSphinx['time']; $quorum_actif = false; $quorum = array(); $formR['raisonSociale'] = $raisonSociale; if ($resSphinx['total'] == 0) { $pass = 1; $criteres = 'ITSEPDLVNR'; initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max); // Nombre de mots pour le quorum if (isset($formR['raisonSociale']) == true) { $quorum['raisonSociale'] = nombreDeMots($resSphinx, $formR['raisonSociale']); } if 
(isset($formR['voie']) == true) { $quorum['voie'] = nombreDeMots($resSphinx, $formR['voie']); } if (isset($formR['ville']) == true) { $quorum['ville'] = nombreDeMots($resSphinx, $formR['ville']); } } } while ($pass > 0) { filtreSiege($formR, $criteres, $sphinx); filtreActif($formR, $criteres, $sphinx); // Requete Sphinx $resSphinx = requeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, $quorum_actif, $quorum, $sirenValide); afficheStatusSphinx($sphinx, $resSphinx); if ($resSphinx == false) { return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'erreur' => $sphinx->GetLastError(), 'pass' => $pass, 'criteres' => $criteres); } $total_time += $resSphinx['time']; if ($resSphinx['total'] > 0 && ($total_premiere_requete == 0 || $total_premiere_requete >= $resSphinx['total'])) { break; } if (isset($sequence) == false) { // Criteres de depart $criteres = criteresDeDepart($formR, $form2crit); debugln("criteres de depart='$criteres'"); // Sequence $sequence = nouvelleSequence($criteres); if ($sequence == array()) { debugln('fin des sequences'); if (changePass($pass, $mode, $index, $quorum_actif, $formR) == true) { $criteres = 'ITSEPDLVNR'; initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max); $sequencePos = 0; continue; } else { break; } } $sequencePos = 0; if (DEBUG) { print "sequence='"; foreach ($sequence as $valeur) { print $valeur.' 
'; } println("'"); } // Pour les nouveaux criteres $comb2crit = array( '00'=> ' ', '11'=> 'IT ', '12'=> 'I ', '13'=> ' T ', '21'=> ' D NR', '22'=> ' D VNR', '23'=> ' DL N ', '24'=> ' DL NR', '25'=> ' P NR', '26'=> ' P VN ', '27'=> ' PD VNR', '28'=> ' PD N ', '30'=> ' S ', '31'=> ' SE ', '32'=> ' SE R', '33'=> ' SE N ', '34'=> ' SE NR', '35'=> ' SE V ', '36'=> ' SE V R', '37'=> ' SE VNR', '40'=> ' SE D ', '41'=> ' SE D N ', '42'=> ' SE D V ', '43'=> ' SE D V R', '44'=> ' SE D VN ', '45'=> ' SE D VNR', '46'=> ' SE DL ', '47'=> ' SE DL R', '48'=> ' SE DL N ', '49'=> ' SE DL NR', '60'=> ' SEP ', '61'=> ' SEP N ', '62'=> ' SEP NR', '63'=> ' SEP V ', '64'=> ' SEP V R', '65'=> ' SEP VNR', '71'=> ' SEPD ', '72'=> ' SEPD R', '73'=> ' SEPD N ', '74'=> ' SEPD NR', '75'=> ' SEPD V ', '76'=> ' SEPD V R', '77'=> ' SEPD VN ', '78'=> ' SEPD VNR', '81'=> ' SEPDL R', '82'=> ' SEPDL N ', '83'=> ' SEPDL NR', ); } // Combinaison $combinaison = nouvelleCombinaison($sequence, $sequencePos, $pass, $index, $mode); if ($combinaison == '') { debugln('fin des combinaisons'); if (changePass($pass, $mode, $index, $quorum_actif, $formR) == true) { $criteres = 'ITSEPDLVNR'; initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max); $sequencePos = 0; continue; } else { break; } } debugln("combinaison='$combinaison'"); if (strlen($combinaison) == 3) { $combinaison = substr($combinaison, 0, 2); } // Nouveaux criteres $criteres = nouveauxCriteres($comb2crit, $combinaison); if ($criteres == '') { debugln("combinaison inconnue: '$combinaison'"); break; } debugln("nouveau criteres='$criteres'"); $sphinx->SetMatchMode($mode); $sphinx->resetFilters(); } $resSphinx['pass'] = $pass; // Reprise de la premiere requete si elle etait meilleure if ($pass > 0 && $total_premiere_requete > 0 && $total_premiere_requete < $resSphinx['total']) { $index = 'ent'; $mode = SPH_MATCH_EXTENDED2; $pass = 0; $criteres = 'ITSEPDLVNR'; initSphinx($sphinx, $mode, $pass, $deb, $nbRep, $max); $resSphinx = 
premiereRequeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, $sirenValide); $total_time += $resSphinx['time']; // Sans la gestion des mots non significatifs if ($resSphinx['total'] == 0) { $resSphinx = requeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, false, $quorum, $sirenValide); $total_time += $resSphinx['time']; } // Sans la gestion des mots non significatifs et sans la localité if ($resSphinx['total'] == 0 && isset($formR['departement']) == true) { $criteres = 'ITSEPD VNR'; $sphinx->resetFilters(); $resSphinx = requeteSphinx($sphinx, $index, $formR, $criteres, $criteresSphinx, $form2crit, false, $quorum, $sirenValide); $total_time += $resSphinx['time']; } $resSphinx['pass'] = $pass; } if ($resSphinx['total'] == 0) { return array( 'nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => $total_time, 'pass' => $pass, 'criteres' => $criteres); } if (DEBUG) { $base2form = array( 'adr_dep' => 'departement', 'adr_cp' => 'localite', 'adr_num' => 'numVoie', 'adr_libVoie' => 'voie', 'adr_comp' => 'voie', 'adr_ville' => 'ville', 'raisonSociale' => 'raisonSociale', 'enseigne' => 'raisonSociale', 'sigle' => 'raisonSociale', 'identite_pre' => 'raisonSociale'); afficheDB($resSphinx, $formR, $form2crit, 'etablissements', $base2form, $deb, $nbRep); } //file_put_contents('test.log', print_r($resSphinx,1)); // Reponse if ($gDatabaseJO == false) { return array( 'nbReponses' => 0, 'nbReponsesTotal' => $resSphinx['total'], 'duree' => $total_time, 'erreur' => 'Base inaccessible'); } if (isset($resSphinx['matches']) == false) { return array( 'nbReponses' => 0, 'nbReponsesTotal' => $resSphinx['total'], 'duree' => $total_time, 'erreur' => 'Aucun résultat'); } $requeteDB = 'SELECT id, source, source_id, CONCAT(LPAD(siren,9,0),LPAD(nic,5,0)) AS siret, LPAD(siren,9,0) AS siren, LPAD(nic,5,0) AS nic, siege, raisonSociale, sigle, enseigne, adr_num, adr_btq, adr_typeVoie, adr_libVoie, adr_comp, LPAD(adr_cp,5,0) AS adr_cp, adr_ville, 
libPays AS pays, LPAD(tel,10,0) AS tel, LPAD(fax,10,0) AS fax, cj, actif, ape_etab, ape_entrep, (siren>200) AS sirenValide FROM etablissements LEFT OUTER JOIN tabPays ON codePaysInsee = IF(adr_dep=99,adr_com,null) WHERE id IN('. $i = 0; foreach ($resSphinx['matches'] as $id => $element) { if($i > 0) $requeteDB.= ','; $requeteDB.= $element['id']; $i++; } $requeteDB.= ') ORDER BY sirenValide DESC, actif DESC, siege DESC, rang DESC'; //file_put_contents('test.log', $requeteDB); debugln(); debugln("requeteDB='$requeteDB'"); $resDB = $gDatabaseJO->query($requeteDB); return reponse($resSphinx, $resDB, $criteres, $total_time, $formR,$form2crit, $deb); } // --------------------------------------------------------------------------- // // sommeDeControle // --------------------------------------------------------------------------- // function sommeDeControle($sn) { $s = 0; $n = strlen($sn); for ($i = 0; $i < $n; ++$i) { if ($i & 1) { $t = substr($sn, $n - $i - 1, 1) << 1; $s += ($t > 9)? $t - 9 : $t; } else { $s += substr($sn, $n - $i - 1, 1); } } return $s % 10; } // --------------------------------------------------------------------------- // // Verification du siret // --------------------------------------------------------------------------- // function verificationDuSiret($siret) { if (strlen($siret) == 14) { $sn = substr($siret, 0, 9); $st = $siret; } else if (strlen($siret) == 9) { $sn = $siret; $st = 0; } else { // TODO: message d'erreur et/ou correction return false; } // Verification du siren $s = sommeDeControle($sn); if ($s != 0) { // Correction du chiffre de controle $sr = (substr($sn, 8, 1) - $s + 10) % 10; $liste = array(substr($sn, 0, 8).$sr); // Transpositions for ($i = 0; $i < 8; ++$i) { $n1 = substr($sn, $i, 1); $n2 = substr($sn, $i + 1, 1); if ($n1 == $n2) { continue; } $p = ''; if ($i > 0) { $p .= substr($sn, 0, $i); } $p .= $n2; if ($i < 7) { $p .= $n1; } if ($i < 6) { $p .= substr($sn, $i + 2, 6 - $i); } if ($i & 1) { if ($i < 7) { if ($n1 >= 5) { 
$n1 -= 9; } if ($n2 >= 5) { $n2 -= 9; } } else { $n1 = ($n1 >= 5) ? ($n1 << 1) - 9 : ($n1 << 1); $n2 = ($n2 >= 5) ? ($n2 << 1) - 9 : ($n2 << 1); } $p .= ($sr + $n1 - $n2 + 10) % 10; } else { if ($n2 >= 5) { $n2 -= 9; } if ($n1 >= 5) { $n1 -= 9; } $p .= ($sr + $n2 - $n1 + 10) % 10; } $liste[] = $p; } // Substitutions for ($i = 0; $i < 8; ++$i) { $n = substr($sn, $i, 1); for ($j = 0; $j < 10; ++$j) { if ($j == $n) { continue; } $p = ''; if ($i > 0) { $p .= substr($sn, 0, $i); } $p .= $j; if ($i < 7) { $p .= substr($sn, $i + 1, 7 - $i); } if ($i & 1) { $n1 = ($n << 1); if ($n1 > 9) { $n1 -= 9; } $n2 = ($j << 1); if ($n2 > 9) { $n2 -= 9; } $p .= ($sr + $n1 - $n2 + 10) % 10; } else { $p .= ($sr + $n - $j + 10) % 10; } $liste[] = $p; } } return $liste; } if ($st == 0) { return false; } // Verification du siret if (sommeDeControle($st) != 0) { return array($sn); } return false; } // --------------------------------------------------------------------------- // // Recherche // --------------------------------------------------------------------------- // function recherche(&$formR, $deb = 0, $nbRep = 20, $max = 1000) { if ($formR['type'] == 'ent') { return rechercheEnt($formR, $deb, $nbRep, $max); } else if ($formR['type'] == 'dir') { return rechercheDir($formR, $deb, $nbRep, $max); } else if ($formR['type'] == 'act') { return rechercheAct($formR, $deb, $nbRep, $max); } else { debugln('Type de recherche inconnu'); return array('nbReponses' => 0, 'nbReponsesTotal' => 0, 'duree' => 0, 'erreur' => 'Type de recherche inconnu'); } } ?>