' : ' <').
          ($search['fields'][$key]['inc'] ? '=' : '').
          " '".$search['fields'][$key]['date']."'"
          );
      }
    }
  }

  if (isset($search['fields']['cat']))
  {
    if ($search['fields']['cat']['sub_inc'])
    {
      // searching all the categories id of sub-categories
      $cat_ids = get_subcat_ids($search['fields']['cat']['words']);
    }
    else
    {
      $cat_ids = $search['fields']['cat']['words'];
    }

    $local_clause = 'category_id IN ('.implode(',', $cat_ids).')';
    array_push($clauses, $local_clause);
  }

  // adds brackets around where clauses
  $clauses = prepend_append_array_items($clauses, '(', ')');

  $where_separator =
    implode(
      "\n ".$search['mode'].' ',
      $clauses
      );

  $search_clause = $where_separator;

  return $search_clause;
}

/**
 * Returns the list of image ids matching an advanced ("regular") search.
 *
 * Two sources are combined:
 *  - images selected by the SQL clause built by get_sql_search_clause(),
 *    restricted by $images_where and by the get_sql_condition_FandF()
 *    filter, ordered with $conf['order_by'];
 *  - images returned by get_image_ids_for_tags() when
 *    $search['fields']['tags'] is set.
 * When tag matches exist they are combined with the SQL matches according
 * to $search['mode']: 'AND' intersects (or uses the tag matches alone when
 * there is no SQL clause), 'OR' produces the de-duplicated union.
 *
 * @param array $search advanced search array
 * @param string $images_where optional additional SQL restriction, appended
 *        with AND to the search clause
 * @return array list of image ids, indexed from 0
 */
function get_regular_search_results($search, $images_where)
{
  global $conf;

  $forbidden = get_sql_condition_FandF(
    array
      (
        'forbidden_categories' => 'category_id',
        'visible_categories' => 'category_id',
        'visible_images' => 'id'
      ),
    "\n AND"
    );

  $items = array();
  $tag_items = array();

  if (isset($search['fields']['tags']))
  {
    $tag_items = get_image_ids_for_tags(
      $search['fields']['tags']['words'],
      $search['fields']['tags']['mode']
      );
  }

  $search_clause = get_sql_search_clause($search);

  if (!empty($search_clause))
  {
    $query = ' SELECT DISTINCT(id) FROM '.IMAGES_TABLE.' i INNER JOIN '.IMAGE_CATEGORY_TABLE.' AS ic ON id = ic.image_id WHERE '.$search_clause;

    if (!empty($images_where))
    {
      $query .= "\n AND ".$images_where;
    }

    $query .= $forbidden." \n".$conf['order_by'];
    $items = array_from_query($query, 'id');
  }

  if (!empty($tag_items))
  {
    switch ($search['mode'])
    {
      case 'AND':
        if (empty($search_clause))
        {
          // no SQL criteria at all: the tag matches are the whole result
          $items = $tag_items;
        }
        else
        {
          $items = array_values(
            array_intersect($items, $tag_items)
            );
        }
        break;

      case 'OR':
        // array_unique() keeps the original keys, which leaves gaps once
        // duplicates are dropped; re-index so the result is a contiguous
        // list, exactly like the AND branch returns.
        $items = array_values(
          array_unique(
            array_merge($items, $tag_items)
            )
          );
        break;
    }
  }

  return $items;
}

/**
 * Lower-cases $term and passes it through remove_accents().
 * mb_strtolower() is used when the mbstring extension provides it,
 * strtolower() otherwise.
 *
 * @param string $term
 * @return string
 */
if (function_exists('mb_strtolower'))
{
  function transliterate($term)
  {
    return remove_accents( mb_strtolower($term) );
  }
}
else
{
  function transliterate($term)
  {
    return remove_accents( strtolower($term) );
  }
}

/**
 * Tells whether $ch counts as part of a word: an ASCII digit, an ASCII
 * letter, or any character whose ord() value is above 127.
 *
 * @param string $ch
 * @return bool
 */
function is_word_char($ch)
{
  return ($ch>='0' && $ch<='9') || ($ch>='a' && $ch<='z') || ($ch>='A' && $ch<='Z') || ord($ch)>127;
}

/**
 * analyzes and splits the quick/query search query $q into tokens
 * q='john bill' => 2 tokens 'john' 'bill'
 * Special characters for MySql full text search (+,<,>,~) appear in the token modifiers.
 * The query can contain a phrase: 'Pierre "New York"' will return 'pierre' and 'new york'.
*/ function analyse_qsearch($q, &$qtokens, &$qtoken_modifiers) { $q = stripslashes($q); $tokens = array(); $token_modifiers = array(); $crt_token = ""; $crt_token_modifier = ""; $state = 0; for ($i=0; $i<~')==0 ) { //special full text modifier if (strlen($crt_token)) { $tokens[] = $crt_token; $token_modifiers[] = $crt_token_modifier; $crt_token = ""; $crt_token_modifier = ""; } $crt_token_modifier .= $ch; } elseif (preg_match('/[\s,.;!\?]+/', $ch)) { // white space if (strlen($crt_token)) { $tokens[] = $crt_token; $token_modifiers[] = $crt_token_modifier; $crt_token = ""; $crt_token_modifier = ""; } } else { $crt_token .= $ch; } break; case 1: // qualified with quotes switch ($ch) { case '"': $tokens[] = $crt_token; $token_modifiers[] = $crt_token_modifier; $crt_token = ""; $crt_token_modifier = ""; $state=0; break; default: $crt_token .= $ch; } break; } } if (strlen($crt_token)) { $tokens[] = $crt_token; $token_modifiers[] = $crt_token_modifier; } $qtokens = array(); $qtoken_modifiers = array(); for ($i=0; $i array(85,68,79...) 
* 'qs' => array( * 'matching_tags' => array of matching tags * 'matching_cats' => array of matching categories * 'matching_cats_no_images' =>array(99) - matching categories without images * )) * * @param string q * @param bool super_order_by * @param string images_where optional aditional restriction on images table * @return array */ function get_quick_search_results($q, $super_order_by, $images_where='') { global $user, $conf; $search_results = array( 'items' => array(), 'qs' => array('q'=>stripslashes($q)), ); $q = trim($q); if (empty($q)) { return $search_results; } analyse_qsearch($q, $tokens, $token_modifiers); $q_like_field = '@@__db_field__@@'; //something never in a search $q_like_clause = get_qsearch_like_clause($tokens, $token_modifiers, $q_like_field ); // Step 1 - first we find matches in #images table =========================== $where_clauses='MATCH(i.name, i.comment) AGAINST( \''.$q.'\' IN BOOLEAN MODE)'; if (!empty($q_like_clause)) { $where_clauses .= ' OR '. str_replace($q_like_field, 'CONVERT(file, CHAR)', $q_like_clause); $where_clauses = '('.$where_clauses.')'; } $where_clauses = array($where_clauses); if (!empty($images_where)) { $where_clauses[]='('.$images_where.')'; } $where_clauses[] .= get_sql_condition_FandF ( array( 'visible_images' => 'i.id' ), null, true ); $query = ' SELECT i.id, MATCH(i.name, i.comment) AGAINST( \''.$q.'\' IN BOOLEAN MODE) AS weight FROM '.IMAGES_TABLE.' 
i WHERE '.implode("\n AND ", $where_clauses); $by_weights=array(); $result = pwg_query($query); while ($row = pwg_db_fetch_assoc($result)) { // weight is important when sorting images by relevance if ($row['weight']) { $by_weights[(int)$row['id']] = 2*$row['weight']; } else {//full text does not match but file name match $by_weights[(int)$row['id']] = 2; } } // Step 2 - search tags corresponding to the query $q ======================== $transliterated_tokens = array(); $token_tags = array(); foreach ($tokens as $token) { $transliterated_tokens[] = transliterate($token); $token_tags[] = array(); } // Step 2.1 - find match tags for every token in the query search $all_tags = array(); $query = ' SELECT id, name, url_name, COUNT(image_id) AS nb_images FROM '.TAGS_TABLE.' INNER JOIN '.IMAGE_TAG_TABLE.' ON id=tag_id GROUP BY id'; $result = pwg_query($query); while ($tag = pwg_db_fetch_assoc($result)) { $transliterated_tag = transliterate($tag['name']); // find how this tag matches query tokens for ($i=0; $i0) { if (! 
is_word_char($transliterated_tag[$word_begin-1]) ) break; $word_begin--; } $word_end = $pos + $token_len; while ($word_end 4) $this_score = 0; } if ($this_score>0) $match = max($match, $this_score ); $pos++; } if ($match) { $tag_id = (int)$tag['id']; $all_tags[$tag_id] = $tag; $token_tags[$i][] = array('tag_id'=>$tag_id, 'score'=>$match); } } } $search_results['qs']['matching_tags']=$all_tags; // Step 2.2 - reduce matching tags for every token in the query search $score_cmp_fn = create_function('$a,$b', 'return 100*($b["score"]-$a["score"]);'); foreach ($token_tags as &$tt) { usort($tt, $score_cmp_fn); $nb_images = 0; $prev_score = 0; for ($j=0; $j 200 && $prev_score > $tt[$j]['score'] ) {// "many" images in previous tags and starting from this tag is less relevent $tt = array_slice( $tt, 0, $j); break; } $nb_images += $all_tags[ $tt[$j]['tag_id'] ]['nb_images']; $prev_score = $tt[$j]['score']; } } // Step 2.3 - get the images for tags for ($i=0; $i 'cat_id' ), "\n AND" ); $result = pwg_query($query); while ($row = pwg_db_fetch_assoc($result)) { // weight is important when sorting images by relevance if ($row['nb_images']==0) { $search_results['qs']['matching_cats_no_images'][] = $row; } else { $search_results['qs']['matching_cats'][$row['id']] = $row; } } if ( empty($by_weights) and empty($search_results['qs']['matching_cats']) ) { return $search_results; } // Step 4 - now we have $by_weights ( array image id => weight ) that need // permission checks and/or matching categories to get images from $where_clauses = array(); if ( !empty($by_weights) ) { $where_clauses[]='i.id IN (' . implode(',', array_keys($by_weights)) . ')'; } if ( !empty($search_results['qs']['matching_cats']) ) { $where_clauses[]='category_id IN ('. 
implode(',',array_keys($search_results['qs']['matching_cats'])).')';
  }

  $where_clauses = array( '('.implode("\n OR ",$where_clauses).')' );

  if (!empty($images_where))
  {
    $where_clauses[]='('.$images_where.')';
  }

  $where_clauses[] = get_sql_condition_FandF(
      array
        (
          'forbidden_categories' => 'category_id',
          'visible_categories' => 'category_id',
          'visible_images' => 'i.id'
        ),
      null,true
    );

  $query = ' SELECT DISTINCT(id) FROM '.IMAGES_TABLE.' i INNER JOIN '.IMAGE_CATEGORY_TABLE.' AS ic ON id = ic.image_id WHERE '.implode("\n AND ", $where_clauses)."\n".
  $conf['order_by'];

  $allowed_images = array_from_query( $query, 'id');

  if ( $super_order_by or empty($by_weights) )
  {
    $search_results['items'] = $allowed_images;
    return $search_results;
  }

  $allowed_images = array_flip( $allowed_images );
  $divisor = 5.0 * count($allowed_images);
  foreach ($allowed_images as $id=>$rank )
  {
    $weight = isset($by_weights[$id]) ? $by_weights[$id] : 1;
    $weight -= $rank/$divisor;
    $allowed_images[$id] = $weight;
  }
  arsort($allowed_images, SORT_NUMERIC);
  $search_results['items'] = array_keys($allowed_images);
  return $search_results;
}

/**
 * Resolves a stored search id to its results.
 *
 * The search array is loaded with get_search_array(). When it carries a
 * 'q' entry the search is a quick search and the full structure returned
 * by get_quick_search_results() is passed through; otherwise the ids
 * returned by get_regular_search_results() are wrapped under the 'items'
 * key.
 *
 * @param int $search_id search id
 * @param bool $super_order_by forwarded to get_quick_search_results()
 * @param string $images_where optional additional restriction on images table
 * @return array array holding at least an 'items' entry
 */
function get_search_results($search_id, $super_order_by, $images_where='')
{
  $search = get_search_array($search_id);

  // quick search: delegate entirely, its result already has the right shape
  if ( isset($search['q']) )
  {
    return get_quick_search_results($search['q'], $super_order_by, $images_where);
  }

  return array(
    'items' => get_regular_search_results($search, $images_where),
    );
}
?>