similarface

Sphinx之配置文件

#
# Sphinx configuration file sample
#
# WARNING! While this sample file mentions all available options,
# it contains (very) short helper descriptions only. Please refer to
# doc/sphinx.html for details.
#

#############################################################################
## data source definition
#############################################################################

source src1
{
    # data source type. mandatory, no default value
    # known types are mysql, pgsql, mssql, xmlpipe, xmlpipe2, odbc
    type            = mysql

    #####################################################################
    ## SQL settings (for 'mysql' and 'pgsql' types)
    #####################################################################

    # some straightforward parameters for SQL source types
    sql_host        = localhost
    sql_user        = test
    sql_pass        =
    sql_db            = test
    sql_port        = 3306    # optional, default is 3306

    # UNIX socket name
    # optional, default is empty (reuse client library defaults)
    # usually '/var/lib/mysql/mysql.sock' on Linux
    # usually '/tmp/mysql.sock' on FreeBSD
    #
    # sql_sock        = /tmp/mysql.sock


    # MySQL specific client connection flags
    # optional, default is 0
    #
    # mysql_connect_flags    = 32 # enable compression

    # MySQL specific SSL certificate settings
    # optional, defaults are empty
    #
    # mysql_ssl_cert        = /etc/ssl/client-cert.pem
    # mysql_ssl_key        = /etc/ssl/client-key.pem
    # mysql_ssl_ca        = /etc/ssl/cacert.pem

    # MS SQL specific Windows authentication mode flag
    # MUST be in sync with charset_type index-level setting
    # optional, default is 0
    #
    # mssql_winauth        = 1 # use currently logged on user credentials


    # ODBC specific DSN (data source name)
    # mandatory for odbc source type, no default value
    #
    # odbc_dsn        = DBQ=C:\data;DefaultDir=C:\data;Driver={Microsoft Text Driver (*.txt; *.csv)};
    # sql_query        = SELECT id, data FROM documents.csv


    # ODBC and MS SQL specific, per-column buffer sizes
    # optional, default is auto-detect
    #
    # sql_column_buffers    = content=12M, comments=1M


    # pre-query, executed before the main fetch query
    # multi-value, optional, default is empty list of queries
    # sql_query_pre does pre-query setup, e.g. setting the connection
    # character set as in the examples below
    # sql_query_pre        = SET NAMES utf8
    # sql_query_pre        = SET SESSION query_cache_type=OFF


    # main document fetch query
    # mandatory, integer document ID field MUST be the first selected column
    sql_query        = \
        SELECT id, group_id, UNIX_TIMESTAMP(date_added) AS date_added, title, content \
        FROM documents


    # joined/payload field fetch query
    # joined fields let you avoid (slow) JOIN and GROUP_CONCAT
    # payload fields let you attach custom per-keyword values (eg. for ranking)
    #
    # syntax is FIELD-NAME 'from'  ( 'query' | 'payload-query' ); QUERY
    # joined field QUERY should return 2 columns (docid, text)
    # payload field QUERY should return 3 columns (docid, keyword, weight)
    #
    # REQUIRES that query results are in ascending document ID order!
    # multi-value, optional, default is empty list of queries
    #
    # sql_joined_field    = tags from query; SELECT docid, CONCAT('tag',tagid) FROM tags ORDER BY docid ASC
    # sql_joined_field    = wtags from payload-query; SELECT docid, tag, tagweight FROM tags ORDER BY docid ASC


    # file based field declaration
    #
    # content of this field is treated as a file name
    # and the file gets loaded and indexed in place of a field
    #
    # max file size is limited by max_file_field_buffer indexer setting
    # file IO errors are non-fatal and get reported as warnings
    #
    # sql_file_field        = content_file_path


    # range query setup, query that must return min and max ID values
    # optional, default is empty
    #
    # sql_query will need to reference $start and $end boundaries
    # if using ranged query:
    #
    # sql_query        = \
    #    SELECT doc.id, doc.id AS group, doc.title, doc.data \
    #    FROM documents doc \
    #    WHERE id>=$start AND id<=$end
    #
    # ranged queries fetch the documents in ID intervals, which avoids
    # locking the table with one huge query; this query returns the
    # smallest and the largest document ID
    # sql_query_range        = SELECT MIN(id),MAX(id) FROM documents

    # range query step
    # optional, default is 1024
    # the interval between the min and max ID is walked in steps of this
    # size; the commented example below uses 1000
    # sql_range_step        = 1000
    #
    # example: IDs in (1,2550) with step 1000 make sql_query run 3 times,
    # for (1,1000), (1001,2000) and (2001,2550)
    # sql_query = SELECT * FROM documents WHERE id>=$start AND id<=$end

    # unsigned integer attribute declaration
    # multi-value (an arbitrary number of attributes is allowed), optional
    # optional bit size can be specified, default is 32
    #
    # sql_attr_uint        = author_id
    # sql_attr_uint        = forum_id:9 # 9 bits for forum_id
    sql_attr_uint        = group_id

    # boolean attribute declaration
    # multi-value (an arbitrary number of attributes is allowed), optional
    # equivalent to sql_attr_uint with 1-bit size
    #
    # sql_attr_bool        = is_deleted


    # bigint attribute declaration
    # multi-value (an arbitrary number of attributes is allowed), optional
    # declares a signed (unlike uint!) 64-bit attribute
    #
    # sql_attr_bigint        = my_bigint_id


    # UNIX timestamp attribute declaration
    # multi-value (an arbitrary number of attributes is allowed), optional
    # similar to integer, but can also be used in date functions
    #
    # sql_attr_timestamp    = posted_ts
    # sql_attr_timestamp    = last_edited_ts
    sql_attr_timestamp    = date_added


    # floating point attribute declaration
    # multi-value (an arbitrary number of attributes is allowed), optional
    # values are stored in single precision, 32-bit IEEE 754 format
    #
    # sql_attr_float        = lat_radians
    # sql_attr_float        = long_radians


    # multi-valued attribute (MVA) attribute declaration
    # multi-value (an arbitrary number of attributes is allowed), optional
    # MVA values are variable length lists of unsigned 32-bit integers
    #
    # syntax is ATTR-TYPE ATTR-NAME 'from' SOURCE-TYPE [;QUERY] [;RANGE-QUERY]
    # ATTR-TYPE is 'uint' or 'timestamp'
    # SOURCE-TYPE is 'field', 'query', or 'ranged-query'
    # QUERY is SQL query used to fetch all ( docid, attrvalue ) pairs
    # RANGE-QUERY is SQL query used to fetch min and max ID values, similar to 'sql_query_range'
    #
    # sql_attr_multi        = uint tag from query; SELECT docid, tagid FROM tags
    # sql_attr_multi        = uint tag from ranged-query; \
    #    SELECT docid, tagid FROM tags WHERE id>=$start AND id<=$end; \
    #    SELECT MIN(docid), MAX(docid) FROM tags


    # string attribute declaration
    # multi-value (an arbitrary number of these is allowed), optional
    # lets you store and retrieve strings
    #
    # sql_attr_string        = stitle


    # JSON attribute declaration
    # multi-value (an arbitrary number of these is allowed), optional
    # lets you store a JSON document as an (in-memory) attribute for later use
    #
    # sql_attr_json        = properties


    # combined field plus attribute declaration (from a single column)
    # stores column as an attribute, but also indexes it as a full-text field
    #
    # sql_field_string    = author


    # post-query, executed on sql_query completion
    # optional, default is empty
    # sql_query_post runs once the main query has finished, e.g. for cleanup
    # sql_query_post        =
    #
    # NOTE: how do sql_query_post and sql_query_post_index differ?
    # sql_query_post runs immediately after Sphinx has fetched the data from
    # the database, while sql_query_post_index only runs once the index has
    # actually been built successfully. This matters: a strictly correct
    # setup should not update the delta (incremental) timestamp in
    # sql_query_pre or sql_query_post, but in sql_query_post_index.
    # The two also run on different database (TCP) connections: building the
    # index after the fetch can take a long time, so Sphinx closes the
    # database connection and reconnects once the index is built, which means
    # sql_query_post_index is executed on a separate connection.

    # post-index-query, executed on successful indexing completion
    # optional, default is empty
    # $maxid expands to max document ID actually fetched from DB
    # use it for any final cleanup; the example below records the max indexed ID
    #
    # sql_query_post_index = REPLACE INTO counters ( id, val ) \
    #    VALUES ( 'max_indexed_id', $maxid )


    # ranged query throttling, in milliseconds
    # optional, default is 0 which means no delay
    # enforces given delay before each query step
    sql_ranged_throttle    = 0


    # kill-list query, fetches the document IDs for kill-list
    # k-list will suppress matches from preceding indexes in the same query
    # optional, default is empty
    #
    # sql_query_killlist = SELECT id FROM documents WHERE edited>=@last_reindex


    # columns to unpack on indexer side when indexing
    # multi-value, optional, default is empty list
    #
    # unpack_zlib = zlib_column
    # unpack_mysqlcompress = compressed_column
    # unpack_mysqlcompress = compressed_column_2


    # maximum unpacked length allowed in MySQL COMPRESS() unpacker
    # optional, default is 16M
    #
    # unpack_mysqlcompress_maxsize = 16M


    # hook command to run when SQL connection succeeds
    # optional, default value is empty (do nothing)
    #
    # hook_connect = bash sql_connect.sh


    # hook command to run after (any) SQL range query
    # it may print out "minid maxid" (w/o quotes) to override the range
    # optional, default value is empty (do nothing)
    #
    # hook_query_range = bash sql_query_range.sh


    # hook command to run on successful indexing completion
    # $maxid expands to max document ID actually fetched from DB
    # optional, default value is empty (do nothing)
    #
    # hook_post_index = bash sql_post_index.sh $maxid

    #####################################################################
    ## xmlpipe2 settings
    #####################################################################

    # type = xmlpipe

    # shell command to invoke xmlpipe stream producer
    # mandatory
    #
    # xmlpipe_command = cat /var/test.xml

    # xmlpipe2 field declaration
    # multi-value, optional, default is empty
    #
    # xmlpipe_field = subject
    # xmlpipe_field = content


    # xmlpipe2 attribute declaration
    # multi-value, optional, default is empty
    # all xmlpipe_attr_XXX options are fully similar to sql_attr_XXX
    # examples:
    #
    # xmlpipe_attr_timestamp = published
    # xmlpipe_attr_uint = author_id
    # xmlpipe_attr_bool = is_enabled
    # xmlpipe_attr_float = latitude
    # xmlpipe_attr_bigint = guid
    # xmlpipe_attr_multi = tags
    # xmlpipe_attr_multi_64 = tags64
    # xmlpipe_attr_string = title
    # xmlpipe_attr_json = extra_data
    # xmlpipe_field_string = content


    # perform UTF-8 validation, and filter out incorrect codes
    # avoids XML parser choking on non-UTF-8 documents
    # optional, default is 0
    #
    # xmlpipe_fixup_utf8 = 1
}


# inherited source example
#
# all the parameters are copied from the parent source,
# and may then be overridden in this source definition
source src1throttled : src1
{
    # same as src1, but waits 100 ms before each ranged query step
    sql_ranged_throttle    = 100
}

#############################################################################
## index definition
#############################################################################

# local index example
#
# this is an index which is stored locally in the filesystem
#
# all indexing-time options (such as morphology and charsets)
# are configured per local index
index test1 {
    # index type
    # optional, default is 'plain'
    # known values are 'plain', 'distributed', and 'rt' (see samples below)
    # type = plain

    # document source(s) to index
    # multi-value, mandatory
    # document IDs must be globally unique across all sources
    source            = src1

    # index files path and file name, without extension
    # mandatory, path must be writable, extensions will be auto-appended
    path            = /var/data/test1

    # document attribute values (docinfo) storage mode
    # optional, default is 'extern'
    # known values are 'none', 'extern' and 'inline'
    docinfo            = extern

    # dictionary type, 'crc' or 'keywords'
    # crc is faster to index when no substring/wildcards searches are needed
    # crc with substrings might be faster to search but is much slower to index
    # (because all substrings are pre-extracted as individual keywords)
    # keywords is much faster to index with substrings, and index is much (3-10x) smaller
    # keywords supports wildcards, crc does not, and never will
    # optional, default is 'keywords'
    dict            = keywords

    # memory locking for cached data (.spa and .spi), to prevent swapping
    # optional, default is 0 (do not mlock)
    # requires searchd to be run from root
    mlock            = 0

    # a list of morphology preprocessors to apply
    # optional, default is empty
    #
    # builtin preprocessors are 'none', 'stem_en', 'stem_ru', 'stem_enru',
    # 'soundex', and 'metaphone'; additional preprocessors available from
    # libstemmer are 'libstemmer_XXX', where XXX is algorithm code
    # (see libstemmer_c/libstemmer/modules.txt)
    #
    # morphology = stem_en, stem_ru, soundex
    # morphology = libstemmer_german
    # morphology = libstemmer_sv
    morphology        = none

    # minimum word length at which to enable stemming
    # optional, default is 1 (stem everything)
    #
    # min_stemming_len = 1


    # stopword files list (space separated)
    # optional, default is empty
    # contents are plain text, charset_table and stemming are both applied
    #
    # stopwords = /var/data/stopwords.txt


    # wordforms file, in "mapfrom > mapto" plain text format
    # optional, default is empty
    #
    # wordforms = /var/data/wordforms.txt


    # tokenizing exceptions file
    # optional, default is empty
    #
    # plain text, case sensitive, space insensitive in map-from part
    # one "Map Several Words => ToASingleOne" entry per line
    #
    # exceptions = /var/data/exceptions.txt


    # embedded file size limit
    # optional, default is 16K
    #
    # exceptions, wordforms, and stopwords files smaller than this limit
    # are stored in the index; otherwise, their paths and sizes are stored
    #
    # embedded_limit = 16K

    # minimum indexed word length
    # default is 1 (index everything)
    min_word_len        = 1


    # ignored characters list
    # optional, default value is empty
    #
    # ignore_chars = U+00AD


    # minimum word prefix length to index
    # optional, default is 0 (do not index prefixes)
    #
    # min_prefix_len = 0


    # minimum word infix length to index
    # optional, default is 0 (do not index infixes)
    #
    # min_infix_len = 0


    # maximum substring (prefix or infix) length to index
    # optional, default is 0 (do not limit substring length)
    #
    # max_substring_len = 8


    # list of fields to limit prefix/infix indexing to
    # optional, default value is empty (index all fields in prefix/infix mode)
    #
    # prefix_fields = filename
    # infix_fields = url, domain


    # expand keywords with exact forms and/or stars when searching fit indexes
    # search-time only, does not affect indexing, can be 0 or 1
    # optional, default is 0 (do not expand keywords)
    #
    # expand_keywords = 1


    # n-gram length to index, for CJK indexing
    # only supports 0 and 1 for now, other lengths to be implemented
    # optional, default is 0 (disable n-grams)
    #
    # ngram_len = 1


    # n-gram characters list, for CJK indexing
    # optional, default is empty
    #
    # ngram_chars = U+3000..U+2FA1F


    # phrase boundary characters list
    # optional, default is empty
    #
    # phrase_boundary = ., ?, !, U+2026 # horizontal ellipsis


    # phrase boundary word position increment
    # optional, default is 0
    #
    # phrase_boundary_step = 100


    # blended characters list
    # blended chars are indexed both as separators and valid characters
    # for instance, AT&T will result in 3 tokens ("at", "t", and "at&t")
    # optional, default is empty
    #
    # blend_chars = +, &, U+23


    # blended token indexing mode
    # a comma separated list of blended token indexing variants
    # known variants are trim_none, trim_head, trim_tail, trim_both, skip_pure
    # optional, default is trim_none
    #
    # blend_mode = trim_tail, skip_pure


    # whether to strip HTML tags from incoming documents
    # known values are 0 (do not strip) and 1 (do strip)
    # optional, default is 0
    html_strip        = 0

    # what HTML attributes to index if stripping HTML
    # optional, default is empty (do not index anything)
    #
    # html_index_attrs = img=alt,title; a=title;


    # what HTML elements contents to strip
    # optional, default is empty (do not strip element contents)
    #
    # html_remove_elements = style, script


    # whether to preopen index data files on startup
    # optional, default is 0 (do not preopen), searchd-only
    #
    # preopen = 1


    # whether to enable in-place inversion (2x less disk, 90-95% speed)
    # optional, default is 0 (use separate temporary files), indexer-only
    #
    # inplace_enable = 1


    # in-place fine-tuning options
    # optional, defaults are listed below
    #
    # inplace_hit_gap = 0 # preallocated hitlist gap size
    # inplace_docinfo_gap = 0 # preallocated docinfo gap size
    # inplace_reloc_factor = 0.1 # relocation buffer size within arena
    # inplace_write_factor = 0.1 # write buffer size within arena


    # whether to index original keywords along with stemmed versions
    # enables "=exactform" operator to work
    # optional, default is 0
    #
    # index_exact_words = 1


    # position increment on overshort (less than min_word_len) words
    # optional, allowed values are 0 and 1, default is 1
    #
    # overshort_step = 1


    # position increment on stopword
    # optional, allowed values are 0 and 1, default is 1
    #
    # stopword_step = 1


    # hitless words list
    # positions for these keywords will not be stored in the index
    # optional, allowed values are 'all', or a list file name
    #
    # hitless_words = all
    # hitless_words = hitless.txt


    # detect and index sentence and paragraph boundaries
    # required for the SENTENCE and PARAGRAPH operators to work
    # optional, allowed values are 0 and 1, default is 0
    #
    # index_sp = 1


    # index zones, delimited by HTML/XML tags
    # a comma separated list of tags and wildcards
    # required for the ZONE operator to work
    # optional, default is empty string (do not index zones)
    #
    # index_zones = title, h*, th


    # index per-document and average per-index field lengths, in tokens
    # required for the BM25A(), BM25F() in expression ranker
    # optional, default is 0 (do not index field lengths)
    #
    # index_field_lengths = 1


    # regular expressions (regexps) to filter the fields and queries with
    # gets applied to data source fields when indexing
    # gets applied to search queries when searching
    # multi-value, optional, default is empty list of regexps
    #
    # regexp_filter = \b(\d+)\" => \1inch
    # regexp_filter = (blue|red) => color


    # list of the words considered frequent with respect to bigram indexing
    # optional, default is empty
    #
    # bigram_freq_words = the, a, i, you, my


    # bigram indexing mode
    # known values are none, all, first_freq, both_freq
    # optional, default is none (do not index bigrams)
    #
    # bigram_index = both_freq


    # snippet document file name prefix
    # prepended to file names when generating snippets using load_files option
    # WARNING, this is a prefix (not a path), trailing slash matters!
    # optional, default is empty
    #
    # snippets_file_prefix = /mnt/mydocs/server1


    # whether to apply stopwords before or after stemming
    # optional, default is 0 (apply stopwords after stemming)
    #
    # stopwords_unstemmed = 0


    # path to a global (cluster-wide) keyword IDFs file
    # optional, default is empty (use local IDFs)
    #
    # global_idf = /usr/local/sphinx/var/global.idf
}


# inherited index example
#
# all the parameters are copied from the parent index,
# and may then be overridden in this index definition
index test1stemmed : test1
{
    # same as test1, but stored separately and with English stemming enabled
    path            = /var/data/test1stemmed
    morphology        = stem_en
}


# distributed index example
#
# this is a virtual index which can NOT be directly indexed,
# and only contains references to other local and/or remote indexes
index dist1
{
    # 'distributed' index type MUST be specified
    type            = distributed

    # local index to be searched
    # there can be many local indexes configured
    local            = test1
    local            = test1stemmed

    # remote agent
    # multiple remote agents may be specified
    # syntax for TCP connections is 'hostname:port:index1,[index2[,...]]'
    # syntax for local UNIX connections is '/path/to/socket:index1,[index2[,...]]'
    agent            = localhost:9313:remote1
    agent            = localhost:9314:remote2,remote3
    # agent            = /var/run/searchd.sock:remote4

    # remote agent mirrors groups, aka mirrors, aka HA agents
    # defines 2 or more interchangeable mirrors for a given index part
    #
    # agent = server3:9312 | server4:9312 :indexchunk2
    # agent = server3:9312:chunk2server3 | server4:9312:chunk2server4
    # agent = server3:chunk2server3 | server4:chunk2server4
    # agent = server21|server22|server23:chunk2


    # blackhole remote agent, for debugging/testing
    # network errors and search results will be ignored
    #
    # agent_blackhole = testbox:9312:testindex1,testindex2


    # persistently connected remote agent
    # reduces connect() pressure, requires that workers IS threads
    #
    # agent_persistent = testbox:9312:testindex1,testindex2


    # remote agent connection timeout, milliseconds
    # optional, default is 1000 ms, ie. 1 sec
    agent_connect_timeout    = 1000

    # remote agent query timeout, milliseconds
    # optional, default is 3000 ms, ie. 3 sec
    agent_query_timeout        = 3000

    # HA mirror agent strategy
    # optional, default is random (random mirror)
    # known values are nodeads, noerrors, roundrobin, nodeadstm, noerrorstm
    #
    # ha_strategy = nodeads

    # path to RLP context file
    # optional, default is empty
    #
    # rlp_context = /usr/local/share/sphinx/rlp/rlp-context.xml
}


# realtime index example
#
# you can run INSERT, REPLACE, and DELETE on this index on the fly
# using MySQL protocol (see 'listen' directive below)
index rt
{
    # 'rt' index type must be specified to use RT index
    type            = rt

    # index files path and file name, without extension
    # mandatory, path must be writable, extensions will be auto-appended
    path            = /var/data/rt

    # RAM chunk size limit
    # RT index will keep at most this much data in RAM, then flush to disk
    # optional, default is 128M
    #
    # rt_mem_limit = 512M

    # full-text field declaration
    # multi-value, mandatory
    rt_field        = title
    rt_field        = content

    # unsigned integer attribute declaration
    # multi-value (an arbitrary number of attributes is allowed), optional
    # declares an unsigned 32-bit attribute
    rt_attr_uint        = gid

    # RT indexes currently support the following attribute types:
    # uint, bigint, float, timestamp, string, mva, mva64, json
    #
    # rt_attr_bigint = guid
    # rt_attr_float = gpa
    # rt_attr_timestamp = ts_added
    # rt_attr_string = author
    # rt_attr_multi = tags
    # rt_attr_multi_64 = tags64
    # rt_attr_json = extra_data
}

#############################################################################
## indexer settings
#############################################################################
 indexer {
    # memory limit, in bytes, kilobytes (16384K) or megabytes (256M)
    # optional, default is 128M, max is 2047M, recommended is 256M to 1024M
    mem_limit        = 128M

    # maximum IO calls per second (for I/O throttling)
    # optional, default is 0 (unlimited)
    #
    # max_iops = 40


    # maximum IO call size, bytes (for I/O throttling)
    # optional, default is 0 (unlimited)
    #
    # max_iosize = 1048576


    # maximum xmlpipe2 field length, bytes
    # optional, default is 2M
    #
    # max_xmlpipe2_field = 4M


    # write buffer size, bytes
    # several (currently up to 4) buffers will be allocated
    # write buffers are allocated in addition to mem_limit
    # optional, default is 1M
    #
    # write_buffer = 1M


    # maximum file field adaptive buffer size
    # optional, default is 8M, minimum is 1M
    #
    # max_file_field_buffer = 32M


    # how to handle IO errors in file fields
    # known values are 'ignore_field', 'skip_document', and 'fail_index'
    # optional, default is 'ignore_field'
    #
    # on_file_field_error = skip_document


    # lemmatizer cache size
    # improves the indexing time when the lemmatization is enabled
    # optional, default is 256K
    #
    # lemmatizer_cache = 512M
}

#############################################################################
## searchd settings
#############################################################################
 searchd { # [hostname:]port[:protocol], or /unix/socket/path to listen on
    # known protocols are 'sphinx' (SphinxAPI) and 'mysql41' (SphinxQL)
    #     # multi-value, multiple listen points are allowed
    # optional, defaults are 9312:sphinx and 9306:mysql41, as below
    #     # listen = 127.0.0.1
    # listen = 192.168.0.1:9312
    # listen = 9312
    # listen = /var/run/searchd.sock
    listen            = 9312 listen = 9306:mysql41 # log file, searchd run info is logged here
    # optional, default is 'searchd.log'
    log            = /var/log/searchd.log # query log file, all search queries are logged here
    # optional, default is empty (do not log queries)
    query_log        = /var/log/query.log # client read timeout, seconds
    # optional, default is 5
    read_timeout        = 5

    # request timeout, seconds
    # optional, default is 5 minutes
    client_timeout        = 300

    # maximum amount of children to fork (concurrent searches to run)
    # optional, default is 0 (unlimited)
    max_children        = 30

    # maximum amount of persistent connections from this master to each agent host
    # optional, but necessary if you use agent_persistent. It is reasonable to set the value
    # as max_children, or less on the agent's hosts.
    persistent_connections_limit    = 30

    # PID file, searchd process ID file name
    # mandatory
    pid_file        = /var/log/searchd.pid # seamless rotate, prevents rotate stalls if precaching huge datasets
    # optional, default is 1
    seamless_rotate        = 1

    # whether to forcibly preopen all indexes on startup
    # optional, default is 1 (preopen everything)
    preopen_indexes        = 1

    # whether to unlink .old index copies on succesful rotation.
    # optional, default is 1 (do unlink)
    unlink_old        = 1

    # attribute updates periodic flush timeout, seconds
    # updates will be automatically dumped to disk this frequently
    # optional, default is 0 (disable periodic flush)
    #     # attr_flush_period = 900


    # MVA updates pool size
    # shared between all instances of searchd, disables attr flushes!
    # optional, default size is 1M
    mva_updates_pool    = 1M # max allowed network packet size
    # limits both query packets from clients, and responses from agents
    # optional, default size is 8M
    max_packet_size        = 8M # max allowed per-query filter count
    # optional, default is 256
    max_filters        = 256

    # max allowed per-filter values count
    # optional, default is 4096
    max_filter_values    = 4096


    # socket listen queue length
    # optional, default is 5
    #     # listen_backlog = 5


    # per-keyword read buffer size
    # optional, default is 256K
    #     # read_buffer = 256K


    # unhinted read size (currently used when reading hits)
    # optional, default is 32K
    #     # read_unhinted = 32K


    # max allowed per-batch query count (aka multi-query count)
    # optional, default is 32
    max_batch_queries    = 32


    # max common subtree document cache size, per-query
    # optional, default is 0 (disable subtree optimization)
    #     # subtree_docs_cache = 4M


    # max common subtree hit cache size, per-query
    # optional, default is 0 (disable subtree optimization)
    #     # subtree_hits_cache = 8M


    # multi-processing mode (MPM)
    # known values are none, fork, prefork, and threads
    # threads is required for RT backend to work
    # optional, default is threads
    workers            = threads # for RT to work


    # max threads to create for searching local parts of a distributed index
    # optional, default is 0, which means disable multi-threaded searching
    # should work with all MPMs (ie. does NOT require workers=threads)
    #     # dist_threads = 4


    # binlog files path; use empty string to disable binlog
    # optional, default is build-time configured data directory
    #     # binlog_path = # disable logging
    # binlog_path = /var/data # binlog.001 etc will be created there


    # binlog flush/sync mode
    # 0 means flush and sync every second
    # 1 means flush and sync every transaction
    # 2 means flush every transaction, sync every second
    # optional, default is 2
    #     # binlog_flush = 2


    # binlog per-file size limit
    # optional, default is 128M, 0 means no limit
    #     # binlog_max_log_size = 256M


    # per-thread stack size, only affects workers=threads mode
    # optional, default is 64K
    #     # thread_stack = 128K


    # per-keyword expansion limit (for dict=keywords prefix searches)
    # optional, default is 0 (no limit)
    #     # expansion_limit = 1000


    # RT RAM chunks flush period
    # optional, default is 0 (no periodic flush)
    #     # rt_flush_period = 900


    # query log file format
    # optional, known values are plain and sphinxql, default is plain
    #     # query_log_format = sphinxql


    # version string returned to MySQL network protocol clients
    # optional, default is empty (use Sphinx version)
    #     # mysql_version_string = 5.0.37


    # default server-wide collation
    # optional, default is libc_ci
    #     # collation_server = utf8_general_ci


    # server-wide locale for libc based collations
    # optional, default is C
    #     # collation_libc_locale = ru_RU.UTF-8


    # threaded server watchdog (only used in workers=threads mode)
    # optional, values are 0 and 1, default is 1 (watchdog on)
    #     # watchdog = 1

    
    # costs for max_predicted_time model, in (imaginary) nanoseconds
    # optional, default is "doc=64, hit=48, skip=2048, match=64"
    #     # predicted_time_costs = doc=64, hit=48, skip=2048, match=64


    # current SphinxQL state (uservars etc) serialization path
    # optional, default is none (do not serialize SphinxQL state)
    #     # sphinxql_state = sphinxvars.sql


    # maximum RT merge thread IO calls per second, and per-call IO size
    # useful for throttling (the background) OPTIMIZE INDEX impact
    # optional, default is 0 (unlimited)
    #     # rt_merge_iops = 40
    # rt_merge_maxiosize = 1M


    # interval between agent mirror pings, in milliseconds
    # 0 means disable pings
    # optional, default is 1000
    #     # ha_ping_interval = 0


    # agent mirror statistics window size, in seconds
    # stats older than the window size (karma) are retired
    # that is, they will not affect master choice of agents in any way
    # optional, default is 60 seconds
    #     # ha_period_karma = 60


    # delay between preforked children restarts on rotation, in milliseconds
    # optional, default is 0 (no delay)
    #     # prefork_rotation_throttle = 100


    # a prefix to prepend to the local file names when creating snippets
    # with load_files and/or load_files_scatter options
    # optional, default is empty
    #
    # snippets_file_prefix = /mnt/common/server1/
}

#############################################################################
## common settings
#############################################################################

 common {
    # NOTE: every option in this section is shown commented out, as an example value

    # lemmatizer dictionaries base path
    # optional, default is /usr/local/share (see ./configure --datadir)
    #
    # lemmatizer_base = /usr/local/share/sphinx/dicts


    # how to handle syntax errors in JSON attributes
    # known values are 'ignore_attr' and 'fail_index'
    # optional, default is 'ignore_attr'
    #
    # on_json_attr_error = fail_index


    # whether to auto-convert numeric values from strings in JSON attributes
    # with auto-conversion, string value with actually numeric data
    # (as in {"key":"12345"}) gets stored as a number, rather than string
    # optional, allowed values are 0 and 1, default is 0 (do not convert)
    #
    # json_autoconv_numbers = 1


    # whether and how to auto-convert key names in JSON attributes
    # known value is 'lowercase'
    # optional, default is unspecified (do nothing)
    #
    # json_autoconv_keynames = lowercase


    # path to RLP root directory
    # optional, default is /usr/local/share (see ./configure --datadir)
    #
    # rlp_root = /usr/local/share/sphinx/rlp


    # path to RLP environment file
    # optional, default is /usr/local/share/rlp-environment.xml (see ./configure --datadir)
    #
    # rlp_environment = /usr/local/share/sphinx/rlp/rlp/etc/rlp-environment.xml


    # maximum total size of documents batched before processing them by the RLP
    # optional, default is 51200
    #
    # rlp_max_batch_size = 100k


    # maximum number of documents batched before processing them by the RLP
    # optional, default is 50
    #
    # rlp_max_batch_docs = 100


    # trusted plugin directory
    # optional, default is empty (disable UDFs)
    #
    # plugin_dir = /usr/local/sphinx/lib
 } # --eof--

你可能感兴趣的:(Sphinx之配置文件)

【K8s】专题十六（3）：Kubernetes 包管理工具之 Helm 语法行者Sun1989 Kubernetes kubernetes 容器云原生 Helm
本文内容均来自个人笔记并重新梳理，如有错误欢迎指正！如果对您有帮助，烦请点赞、关注、转发、订阅专栏！专栏订阅入口|精选文章|Kubernetes|Docker|Linux|羊毛资源|工具推荐|往期精彩文章【Docker】（全网首发）KylinV10下MySQL容器内存占用异常的解决方法【Docker】（全网首发）KylinV10下MySQL容器内存占用异常的解决方法（续）【K8s】专题十六（2）：
SpringBoot 根据配置前缀绑定配置：@ConfigurationProperties JiaHao汤 SpringBoot spring boot 后端 java springboot
文章目录内部Bean配置绑定第三方Bean配置绑定@ConfigurationProperties是Spring在org.springframework.boot.context.properties包中提供的一个注解。它的作用是根据注解中配置的前缀对SpringBoot配置文件（即application.xxx）中前缀相同的配置进行属性绑定。对于@ConfigurationProperties注
Python爬虫学习笔记_DAY_26_Python爬虫之requests库的安装与基本使用【Python爬虫】_requests库ip 苹果Android开发组程序员 python 爬虫学习
最后Python崛起并且风靡，因为优点多、应用领域广、被大牛们认可。学习Python门槛很低，但它的晋级路线很多，通过它你能进入机器学习、数据挖掘、大数据，CS等更加高级的领域。Python可以做网络应用，可以做科学计算，数据分析，可以做网络爬虫，可以做机器学习、自然语言处理、可以写游戏、可以做桌面应用…Python可以做的很多，你需要学好基础，再选择明确的方向。这里给大家分享一份全套的Pytho
Ubuntu18.04系统新手入门糖糖不是堂 ubuntu linux ubuntu
Ubuntu18.04系统新手入门Ubuntu系统介绍Ubuntu系统与Windows系统的区别介绍Ubuntu之灵魂：命令行语句常用启动终端的方法：我的Ubuntu18.04系统入门下载支持Linux系统的deb文件并安装Linux文件管理对比Windows系统常用Linux系统快捷键Ubuntu编程入门第一个C++程序：hello.cpp关于Ubuntu中程序存储位置使用vim或CodeBlo
linux 设置固定内网ip supermiketho linux tcp/ip 服务器
设置内网固定Ip 创建网络配置文件：/etc/sysconfig/network-scripts/ifcfg-ens196(这个名字是根据实际来的) TYPE=Ethernet PROXY_METHOD=none BROWSER_ONLY=no BOOTPROTO=none DEFROUTE=yes IPV4_FAILURE_FATAL=no IPV6INIT=yes IPV6_AUTOCONF=yes IPV6_DE
MyBatis 的核心配置文件是干什么的？它的结构是怎样的？哪些是必须配置的，哪些是可选的？冰糖心书房 Mybatis 源码系列 mybatis
MyBatis的核心配置文件（通常命名为mybatis-config.xml）是MyBatis应用程序的入口点，它定义了MyBatis的全局配置信息。核心配置文件的作用：配置MyBatis的运行时行为:通过标签设置全局参数，控制MyBatis的各种行为，例如是否开启缓存、是否使用延迟加载、是否自动映射等。配置数据源和事务管理器:通过标签配置数据库连接信息和事务管理方式。注册类型别名:通过标签为Ja
AI编程方法第二弹：边提问边调整 leeshuqing AI编程 AI编程
AI编程的提问词非常类似于传统搜索引擎中的检索词，虽然采取了自然语言表示，但是在获取结果的策略上却很一致。因为用户在一开始可能并不非常清楚AI编程工具如何理解用户的提问，因此输出结果可能并不能完全满足用户要求，此时用户可以不断的根据生成结果，动态的灵活的调整提问，使之不断趋近于自己满意的结果。比如，对于“Python”等任意英文单词，允许用户指定总宽度后，通过自动填充空格，使之总宽度尽可能等于该宽
从零开始搭建搜索推荐系统（五十四）多路召回之万剑归宗 hanyi_ 搜索推荐 java java 搜索系统
聊的不止技术。跟着小帅写代码，还原和技术大牛一对一真实对话，剖析真实项目筑成的一砖一瓦，了解最新最及时的资讯信息，还可以学到日常撩妹小技巧哦，让我们开始探索主人公小帅的职场生涯吧！（PS：本系列文章以幽默风趣风格为主，较真侠和杠精请绕道~）一、奶茶引发的血案（会议室里，行服小姐姐把笔记本往桌上一拍，屏幕上是密密麻麻的搜索日志）行服姐姐："小帅！你自己看看！用户搜'朝阳区低糖芝士草莓冰沙'，你家系统
Neo4j之CQL基础风云诀4 图数据库知识图谱大数据人工智能
Neo4j之CQL基础文章目录Neo4j之CQL基础一、CQL概念二、CQL简介三、CQL命令使用creatematch+returnwheredeleteremovesetorderbymerge四、CQL函数使用StringAggregationRelationship一、CQL概念关系型数据库的查询语言是SQL，Neo4j图数据库也有自己的查询语言，那就是CQL。CQL全称CypherQue
Kotlin学习笔记之基础知识 mercyT kotlin 学习笔记
本内容是建立在有java的基础上去学习Kotlin的这门语言的，所以更多的是记录一些与java不同的之处，或者是Kotlin的特性等。基本类型在Kotlin中，所有东西都是对象，在这个意义上讲我们可以在任何变量上调用成员函数和属性。一些类型可以有特殊的内部表示——例如，数字、字符和布尔值可以在运行时表示为原生类型值，但是对于用户来说，它们看起来就像普通的类。在本节中，我们会描述Kotlin中使用的
InSAR个人笔记（三）ISCE之DInSAR处理--topsApp.py 玊363 笔记
数据下载1、哨兵1slc数据下载研究区的选定：首先确定研究区内的范围（经纬度），其次确定下载数据的时间，最后保证两张SAR影像是重复轨道拍摄的（哨兵单颗卫星时间周期为12天，星座为24天）（1）下载网址：ASF：https://search.asf.alaska.edu/#/?zoom=5.000&center=123.354,25.990 https://search.asf.alaska.edu/#/?
fastfds文件服务器搭建酸辣菜菜鱼 linux nginx fastdfs java
文章目录1.fastfds文件服务器搭建1.1环境准备1.2环境编译1.3磁盘目录1.4安装libfascommon1.5安装FastDFS1.6安装fastdfs-nginx-module1.7安装nginx1.8配置文件1.8.1tracker配置1.8.2storage配置1.8.3配置nginx2启动2.1关闭防火墙2.2启动tracker2.3启动storage2.4启动nginx2.4
Python 之进阶学习 _ZestyJt Python python 学习
学习Python之进阶学习一切皆对象1.变量和函数皆对象2.模块和类皆对象3.对象的基本操作(1).可以赋值给变量(2).可以添加到集合中(3).可以作为函数参数(4).可以作为函数返回值返回4.object,type,class之间的关系(1).object类(2).type类和type对象闭包1.查看闭包(1).查看闭包(2).查看环境变量2.分析闭包3.闭包的用处Lambda表达式1.匿名函
TouchGFX之MVP Stone_lu。 STM32 arm开发
TouchGFX用户接口遵循Model-View-Presenter（MVP）架构模式，它是Model-View-Controller（MVC）模式的派生模式。两者都广泛用于构建用户接口应用。MVP模式的主要优势是：关注点分离：将代码分成不同的部分提供，每部分有自己的任务。这使得代码更简单、可重复使用性更高且更易于维护。单元测试：由于UI的逻辑（Presenter）独立于视图（View），因此，单
构建服务端证书校验鸿蒙示例代码
本文原创发布在华为开发者社区。介绍该示例是一个连接网络的Demo,通过socket获取远端证书，在网络通信中，利用套接字（socket）技术来获取与之建立连接的远端服务器的数字证书。构建服务端证书校验源码链接效果预览使用说明打开应用后，点击“点击连接”按钮，获取与之建立连接的远端服务器的数字证书，在后台打印数据。实现思路获取本地ipfunctiongetLocalIp(){constipInfo=
鸿蒙开发-一多开发之断点布局川石教育鸿蒙开发 harmonyos 鸿蒙开发鸿蒙课程培训鸿蒙开发培训鸿蒙开发教程
在HarmonyOS的ArkTS语法中，断点布局是一种用于响应不同屏幕尺寸和设备类型的布局技术。以下是一个简单的断点布局实例，不涉及媒体查询，仅使用ArkTS的内置功能和组件来实现。import{BreakpointSystem,BreakpointConstants}from'@ohos/arkui';@Entry@ComponentstructBreakpointLayoutDemo{priv
Leetcode之随机数索引一只荣 leetcode和机试题 leetcode
题目：给定一个可能含有重复元素的整数数组，要求随机输出给定的数字的索引。您可以假设给定的数字一定存在于数组中。注意：数组大小可能非常大。使用太多额外空间的解决方案将不会通过测试。示例:int[]nums=newint[]{1,2,3,3,3};Solutionsolution=newSolution(nums);solution.pick(3);solution.pick(1);代码：方法一——暴
【云原生之Docker实战】使用Docker部署MongoDB数据库管理工具Mongo-Express 江湖有缘 docker 云原生 Mongo-Express
【云原生之Docker实战】使用Docker部署MongoDB数据库管理工具Mongo-Express一、Mongo-Express介绍1.Mongo-Express简介2.MongoDB简介二、检查本地系统环境1.检查系统版本2.检查docker状态3.检查docker版本三、安装docker-compose1.下载docker-compose二进制包2.给文件增加执行权限3.检查docker-
(4-8)基于DeepSeekMoE架构的DeepSeek-V3：测试模型码农三叔训练 RAG 多模态)架构 transformer deekseek 人工智能大模型
4.8测试模型DeepSeek-V3是一款基于PyTorch的深度学习模型，主要用于文本生成任务。在加载模型时，首先需要从指定路径加载模型的配置文件和预训练权重。加载完成后，模型被设置为评估模式，并移动到GPU上以加速推理过程。在生成文本时，用户可以输入提示文本，模型会根据这些提示生成相应的文本输出。生成过程支持交互式输入和批量处理两种模式，用户可以根据需要选择适合的方式进行文本生成。此外，模型的
Systemd 服务文件（service）比奇堡派星星 linux 服务器
LinuxSystemd服务文件编写指南1.概述在现代Linux系统中，systemd是默认的初始化系统，用于管理系统服务的启动、停止、重启等操作。systemd服务文件（以.service为后缀）是定义服务行为的核心配置文件。本文档将详细介绍如何编写一个systemd服务文件，包括文件结构、常用配置项、操作步骤以及注意事项。2.服务文件的作用systemd服务文件用于定义一个服务的以下行为：服务
一个基于LSTM的字符级文本生成模型的训练+使用(pytorch) 一只小铁柱 lstm pytorch 人工智能
一、代码实现1.配置文件config.pyimporttorch#设备配置DEVICE=torch.device('cuda'iftorch.cuda.is_available()else'cpu')#超参数和配置SEQ_LENGTH=100#输入序列长度BATCH_SIZE=64#批大小EMBEDDING_DIM=256#嵌入层维度HIDDEN_SIZE=512#LSTM隐藏层大小NUM_LAY
NodeJs中npm国内慢的问题解决夏木炎 npm 前端 node.js
方法一：更改npm配置文件：$npmconfigsetregistryhttp://registry.npm.taobao.orgURL即为需要设置的镜像站点地址，如淘宝镜像:http://registry.npm.taobao.org方法二：你可以使用淘宝NPM镜像定制的cnpm(gzip压缩支持)命令行工具代替默认的npm:$npminstall-gcnpm--registry=https:/
设计模式之单例模式：原理、实现与应用 wenbin_java 设计模式单例模式
引言设计模式是软件开发中解决常见问题的经典解决方案。单例模式（SingletonPattern）是其中最基础且常用的设计模式之一，主要用于确保一个类只有一个实例，并提供一个全局访问点。本文将深入探讨单例模式的原理、实现方式以及实际应用场景，帮助你更好地理解和使用这一设计模式。1.单例模式的核心概念1.1什么是单例模式？单例模式是一种创建型设计模式，它确保一个类只有一个实例，并提供一个全局访问点来访
设计模式之工厂模式周努力. 设计模式设计模式
工厂模式属于创建型设计模式的一种，其实在我看来它更是在面向对象编程语言的抽象层的更加灵活的应用。工厂模式其实在创建型模式中难度较高，整体的理解上需要一定时间进行消化，在一些Java常见框架中，这种模式也是频繁出现的设计，如果我们可以在自己的项目中灵活使用这个模式那将会让我们的代码更加灵活、耦合度会更低。此篇文章我们将工厂模式拆成三个不同的工厂形式来循序渐进地讲解，以便开发者能够深刻理解工厂设计模式
普通人怎么利用GPT赚钱之创建自动化工具贫苦游商普通人利用AI搞钱系列 gpt 自动化运维人工智能算法机器学习
利用GPT创建自动化工具：从构想到实现的详细指南在当前快速发展的科技时代，人工智能（AI）正在改变各行各业的工作方式。对于普通人来说，利用GPT（GenerativePre-trainedTransformer）这样的语言模型来创建自动化工具，并通过这些工具赚钱，已经成为一种切实可行的方法。本文将探讨普通人如何在中文平台上利用GPT创建自动化工具，从而实现盈利。什么是GPT？首先，我们需要了解什么
java基础之选择结构（if）、循环结构（for、while）篇 Rookie_lyj java基础 java 开发语言后端
前言本章主要是对选择结构（if-else）、循环结构（for、while）的练习一、选择结构判断闰年题目要求：闰年的条件是能被4整除，但不能被100整除；或能被400整除。思路：输入要判断的年份添加条件（条件1：能被4整除，但不能被100整除，条件2：能被400整除）数据结果 public class test{public static void main(String args[]){Scanner scan
【CMake指南】第1篇：CMake入门基础 JuicyActiveGilbert CMake指南 c++CMake 教程
1.什么是CMake？CMake是一个跨平台的自动化构建工具，用于管理C/C++项目的编译过程。它通过简单的配置文件（CMakeLists.txt）生成不同平台（如Windows的VisualStudio、Linux的Makefile、macOS的Xcode）所需的构建文件，解决手动编写Makefile或维护多平台项目的痛点。为什么选择CMake？跨平台支持：一套配置，多平台编译。简洁高效：语法清
CentOS7下安装MongoDB wjf63000 mongodb 数据库
步骤1：创建MongoDBYum仓库文件你需要创建一个MongoDB的Yum仓库配置文件，以便从官方源下载MongoDB。打开终端并使用以下命令创建并编辑该文件：sudovi/etc/yum.repos.d/mongodb-org-7.0.repo在打开的文件中，输入以下内容：[mongodb-org-7.0]name=MongoDBRepositorybaseurl=https://repo.m
数据中心运维之供应商管理：打造高效合作生态数据中心运维高级工程师数据库网络安全大数据
引言在当今数字化时代，数据中心的稳定、高效运行离不开各类供应商的支持，从硬件设备供应商到运维服务提供商，从软件开发商到安全解决方案供应商，供应商的管理质量直接关系到数据中心的整体运维水平和服务质量。良好的供应商管理不仅能确保数据中心的稳定运行，还能有效降低成本、提升效率、增强竞争力。因此，构建科学、规范、高效的供应商管理体系，已成为数据中心运维管理的重要课题。目的本文旨在为数据中心机房管理者提供一
C++程序设计语言笔记——引言：第三章 C++概览之抽象机制1 钺不言 C++笔记 c++笔记经验分享
C++概览：抽象机制0类C++最核心的语言特性就是类。类是一种用户自定义的数据类型，用于在程序代码中表示某种概念。无论何时，只要我们想为程序设计一个有用的概念、想法或实体，都应该设法把它表示为程序中的一个类，这样我们的想法就能表达成代码，而不是仅存在于我们的头脑中、设计文档里或者注释里。对于一个程序来说，不论是用易读性还是正确性来衡量，使用一组精挑细选的类都要比直接用内置类型完成所有任务更好，尤其
开发者关心的那些事圣子足道 ios 游戏编程 apple 支付
我要在app里添加IAP，必须要注册自己的产品标识符（product identifiers）。产品标识符是什么？产品标识符（Product Identifiers）是一串字符串，它用来识别你在应用内贩卖的每件商品。App Store用产品标识符来检索产品信息，标识符只能包含大小写字母（A-Z）、数字（0-9）、下划线（_）、以及圆点(.)。你可以任意排列这些元素，但我们建议你创建标识符时使用
负载均衡器技术Nginx和F5的优缺点对比 bijian1013 nginx F5
对于数据流量过大的网络中，往往单一设备无法承担，需要多台设备进行数据分流，而负载均衡器就是用来将数据分流到多台设备的一个转发器。目前有许多不同的负载均衡技术用以满足不同的应用需求，如软/硬件负载均衡、本地/全局负载均衡、更高
LeetCode[Math] - #9 Palindrome Number Cwind java Algorithm 题解 LeetCode Math
原题链接：#9 Palindrome Number 要求：判断一个整数是否是回文数，不要使用额外的存储空间难度：简单分析：题目限制不允许使用额外的存储空间应指不允许使用O(n)的内存空间，O(1)的内存用于存储中间结果是可以接受的。于是考虑将该整型数反转，然后与原数字进行比较。注：没有看到有关负数是否可以是回文数的明确结论，例如
画图板的基本实现 15700786134 画图板
要实现画图板的基本功能，除了在qq登陆界面中用到的组件和方法外，还需要添加鼠标监听器，和接口实现。首先，需要显示一个JFrame界面： public class DrameFrame extends JFrame { //显示
linux的ps命令被触发 linux
Linux中的ps命令是Process Status的缩写。ps命令用来列出系统中当前运行的那些进程。ps命令列出的是当前那些进程的快照，就是执行ps命令的那个时刻的那些进程，如果想要动态的显示进程信息，就可以使用top命令。要对进程进行监测和控制，首先必须要了解当前进程的情况，也就是需要查看当前进程，而 ps 命令就是最基本同时也是非常强大的进程查看命令。使用该命令可以确定有哪些进程正在运行
Android 音乐播放器下一曲连续跳几首歌肆无忌惮_ android
最近在写安卓音乐播放器的时候遇到个问题。在MediaPlayer播放结束时会回调 player.setOnCompletionListener(new OnCompletionListener() { @Override public void onCompletion(MediaPlayer mp) { mp.reset(); Log.i("H
java导出txt文件的例子知了ing java servlet
代码很简单就一个servlet,如下： package com.eastcom.servlet; import java.io.BufferedOutputStream; import java.io.IOException; import java.net.URLEncoder; import java.sql.Connection; import java.sql.Resu
Scala stack试玩, 提高第三方依赖下载速度矮蛋蛋 scala sbt
原文地址： http://segmentfault.com/a/1190000002894524 sbt下载速度实在是惨不忍睹, 需要做些配置优化下载typesafe离线包, 保存为ivy本地库 wget http://downloads.typesafe.com/typesafe-activator/1.3.4/typesafe-activator-1.3.4.zip 解压r
phantomjs安装(linux，附带环境变量设置) ，以及casperjs安装。 alleni123 linux spider
1. 首先从官网 http://phantomjs.org/下载phantomjs压缩包，解压缩到/root/phantomjs文件夹。 2. 安装依赖 sudo yum install fontconfig freetype libfreetype.so.6 libfontconfig.so.1 libstdc++.so.6 3. 配置环境变量 vi /etc/profil
JAVA IO FileInputStream和FileOutputStream，字节流的打包输出百合不是茶 java核心思想 JAVA IO操作字节流
在程序设计语言中，数据的保存是基本，如果某程序语言不能保存数据那么该语言是不可能存在的，JAVA是当今最流行的面向对象设计语言之一，在保存数据中也有自己独特的一面，字节流和字符流 1，字节流是由字节构成的，字符流是由字符构成的字节流和字符流都是继承的InputStream和OutPutStream ,java中两种最基本的就是字节流和字符流类 FileInputStream
Spring基础实例（依赖注入和控制反转） bijian1013 spring
前提条件：在http://www.springsource.org/download网站上下载Spring框架，并将spring.jar、log4j-1.2.15.jar、commons-logging.jar加载至工程1.武器接口 package com.bijian.spring.base3; public interface Weapon { void kil
HR看重的十大技能 bijian1013 提升能力 HR 成长
一个人掌握何种技能取决于他的兴趣、能力和聪明程度，也取决于他所能支配的资源以及制定的事业目标，拥有过硬技能的人有更多的工作机会。但是，由于经济发展前景不确定，掌握对你的事业有所帮助的技能显得尤为重要。以下是最受雇主欢迎的十种技能。　　一、解决问题的能力　　每天，我们都要在生活和工作中解决一些综合性的问题。那些能够发现问题、解决问题并迅速作出有效决
【Thrift一】Thrift编译安装 bit1129 thrift
什么是Thrift The Apache Thrift software framework, for scalable cross-language services development, combines a software stack with a code generation engine to build services that work efficiently and s
【Avro三】Hadoop MapReduce读写Avro文件 bit1129 mapreduce
Avro是Doug Cutting(此人绝对是神一般的存在）牵头开发的。开发之初就是围绕着完善Hadoop生态系统的数据处理而开展的（使用Avro作为Hadoop MapReduce需要处理数据序列化和反序列化的场景）,因此Hadoop MapReduce集成Avro也就是自然而然的事情。这个例子是一个简单的Hadoop MapReduce读取Avro格式的源文件进行计数统计，然后将计算结果
nginx定制500，502，503，504页面 ronin47 nginx　错误显示
server { listen 80; error_page 500 /500.html; error_page 502 /502.html; error_page 503 /503.html; error_page 504 /504.html; location /test { return 502; } } 配置很简单，和配
java-1.二叉查找树转为双向链表 bylijinnan 二叉查找树
import java.util.ArrayList; import java.util.List; public class BSTreeToLinkedList { /* 把二元查找树转变成排序的双向链表题目：输入一棵二元查找树，将该二元查找树转换成一个排序的双向链表。要求不能创建任何新的结点，只调整指针的指向。 10 / \ 6 14 / \
Netty源码学习-HTTP-tunnel bylijinnan java netty
Netty关于HTTP tunnel的说明： http://docs.jboss.org/netty/3.2/api/org/jboss/netty/channel/socket/http/package-summary.html#package_description 这个说明有点太简略了一个完整的例子在这里： https://github.com/bylijinnan
JSONUtil.serialize(map)和JSON.toJSONString(map)的区别 coder_xpf jquery json map val()
JSONUtil.serialize(map)和JSON.toJSONString(map)的区别数据库查询出来的map有一个字段为空通过System.out.println()输出 JSONUtil.serialize(map)： {"one":"1","two":"nul
Hibernate缓存总结 cuishikuan 开源 ssh javaweb hibernate缓存三大框架
一、为什么要用Hibernate缓存？ Hibernate是一个持久层框架，经常访问物理数据库。为了降低应用程序对物理数据源访问的频次，从而提高应用程序的运行性能。缓存内的数据是对物理数据源中的数据的复制，应用程序在运行时从缓存读写数据，在特定的时刻或事件会同步缓存和物理数据源的数据。二、Hibernate缓存原理是怎样的？ Hibernate缓存包括两大类：Hib
CentOs6 dalan_123 centos
首先su - 切换到root下面 1、首先要先安装GCC GCC-C++ Openssl等依赖模块：yum -y install make gcc gcc-c++ kernel-devel m4 ncurses-devel openssl-devel 2、再安装ncurses模块 yum -y install ncurses-devel yum install ncurses-devel 3、下载Erang
10款用 jquery 实现滚动条至页面底端自动加载数据效果 dcj3sjt126com JavaScript
无限滚动自动翻页可以说是web2.0时代的一项堪称伟大的技术，它让我们在浏览页面的时候只需要把滚动条拉到网页底部就能自动显示下一页的结果，改变了一直以来只能通过点击下一页来翻页这种常规做法。无限滚动自动翻页技术的鼻祖是微博的先驱：推特(twitter)，后来必应图片搜索、谷歌图片搜索、google reader、箱包批发网等纷纷抄袭了这一项技术，于是靠滚动浏览器滚动条
ImageButton去边框&Button或者ImageButton的背景透明 dcj3sjt126com imagebutton
在ImageButton中载入图片后，很多人会觉得有图片周围的白边会影响到美观，其实解决这个问题有两种方法一种方法是将ImageButton的背景改为所需要的图片。如：android:background="@drawable/XXX" 第二种方法就是将ImageButton背景改为透明，这个方法更常用在XML里； <ImageBut
JSP之c:foreach eksliang jsp forearch
原文出自：http://www.cnblogs.com/draem0507/archive/2012/09/24/2699745.html <c:forEach>标签用于通用数据循环，它有以下属性属性描述是否必须缺省值 items 进行循环的项目否无 begin 开始条件否 0 end 结束条件否集合中的最后一个项目 step 步长否 1
Android实现主动连接蓝牙耳机 gqdy365 android
在Android程序中可以实现自动扫描蓝牙、配对蓝牙、建立数据通道。蓝牙分不同类型，这篇文字只讨论如何与蓝牙耳机连接。大致可以分三步：一、扫描蓝牙设备： 1、注册并监听广播： BluetoothAdapter.ACTION_DISCOVERY_STARTED BluetoothDevice.ACTION_FOUND BluetoothAdapter.ACTION_DIS
android学习轨迹之四：org.json.JSONException: No value for hyz301 json
org.json.JSONException: No value for items 在JSON解析中会遇到一种错误，很常见的错误 06-21 12:19:08.714 2098-2127/com.jikexueyuan.secret I/System.out﹕ Result:{"status":1,"page":1,&
干货分享：从零开始学编程系列汇总 justjavac 编程
程序员总爱重新发明轮子，于是做了要给轮子汇总。从零开始写个编译器吧系列 (知乎专栏) 从零开始写一个简单的操作系统 (伯乐在线) 从零开始写JavaScript框架 (图灵社区) 从零开始写jQuery框架 (蓝色理想 ) 从零开始nodejs系列文章 (粉丝日志) 从零开始编写网络游戏
jquery-autocomplete 使用手册 macroli jquery Ajax 脚本
jquery-autocomplete学习一、用前必备官方网站：http://bassistance.de/jquery-plugins/jquery-plugin-autocomplete/ 当前版本：1.1 需要JQuery版本：1.2.6 二、使用 <script src="./jquery-1.3.2.js" type="text/ja
PLSQL-Developer或者Navicat等工具连接远程oracle数据库的详细配置以及数据库编码的修改超声波 oracle plsql
　　在服务器上将Oracle安装好之后接下来要做的就是通过本地机器来远程连接服务器端的oracle数据库，常用的客户端连接工具就是PLSQL-Developer或者Navicat这些工具了。刚开始也是各种报错，什么TNS:no listener;TNS:lost connection;TNS:target hosts...花了一天的时间终于让PLSQL-Developer和Navicat等这些客户
数据仓库数据模型之：极限存储--历史拉链表 superlxw1234 极限存储数据仓库数据模型拉链历史表
在数据仓库的数据模型设计过程中，经常会遇到这样的需求： 1. 数据量比较大; 2. 表中的部分字段会被update,如用户的地址，产品的描述信息，订单的状态等等; 3. 需要查看某一个时间点或者时间段的历史快照信息，比如，查看某一个订单在历史某一个时间点的状态，比如，查看某一个用户在过去某一段时间内，更新过几次等等; 4. 变化的比例和频率不是很大，比如，总共有10
10点睛Spring MVC4.1-全局异常处理 wiselyman spring mvc
10.1 全局异常处理使用@ControllerAdvice注解来实现全局异常处理; 使用@ControllerAdvice的属性缩小处理范围 10.2 演示演示控制器 package com.wisely.web; import org.springframework.stereotype.Controller; import org.spring