/ranking/querystr.go

https://repo.or.cz/debiancodesearch.git · Go · 45 lines · 30 code · 7 blank · 8 comment · 4 complexity · 1af97fbe9ce2650b411f170253f10342 MD5 · raw file

  1. // vim:ts=4:sw=4:noexpandtab
  2. package ranking
  3. import (
  4. "regexp"
  5. "strings"
  6. )
  7. // Represents a query string with pre-compiled regular expressions for faster
  8. // matching.
  9. type QueryStr struct {
  10. query string
  11. boundaryRegexp *regexp.Regexp
  12. anywhereRegexp *regexp.Regexp
  13. }
  14. func NewQueryStr(query string) QueryStr {
  15. var result QueryStr
  16. result.query = query
  17. // Remove (?i) at the beginning of the query, which (at least currently)
  18. // means case-insensitive.
  19. strippedQuery := strings.Replace(query, "(?i)", "", 1)
  20. // XXX: This only works for very simple (one-word) queries.
  21. quotedQuery := regexp.QuoteMeta(strippedQuery)
  22. //fmt.Printf("quoted query: %s\n", quotedQuery)
  23. result.boundaryRegexp = regexp.MustCompile(`(?i)\b` + quotedQuery + `\b`)
  24. result.anywhereRegexp = regexp.MustCompile(`(?i)` + quotedQuery)
  25. return result
  26. }
  27. func (qs *QueryStr) Match(path *string) float32 {
  28. // XXX: These values might need to be tweaked.
  29. index := qs.boundaryRegexp.FindStringIndex(*path)
  30. if index != nil {
  31. return 0.75 + (0.25 * (1.0 - float32(index[0])/float32(len(*path))))
  32. }
  33. index = qs.anywhereRegexp.FindStringIndex(*path)
  34. if index != nil {
  35. return 0.5 + (0.25 * (1.0 - float32(index[0])/float32(len(*path))))
  36. }
  37. return 0.5
  38. }