PageRenderTime 42ms CodeModel.GetById 16ms RepoModel.GetById 0ms app.codeStats 0ms

/tags/release-0.0.0-rc0/hive/external/ql/src/test/org/apache/hadoop/hive/scripts/extracturl.java

#
Java | 58 lines | 29 code | 7 blank | 22 comment | 3 complexity | 6d92d6c552b66ba0d10672af57dc93a5 MD5 | raw file
Possible License(s): Apache-2.0, BSD-3-Clause, JSON, CPL-1.0
  1. /**
  2. * Licensed to the Apache Software Foundation (ASF) under one
  3. * or more contributor license agreements. See the NOTICE file
  4. * distributed with this work for additional information
  5. * regarding copyright ownership. The ASF licenses this file
  6. * to you under the Apache License, Version 2.0 (the
  7. * "License"); you may not use this file except in compliance
  8. * with the License. You may obtain a copy of the License at
  9. *
  10. * http://www.apache.org/licenses/LICENSE-2.0
  11. *
  12. * Unless required by applicable law or agreed to in writing, software
  13. * distributed under the License is distributed on an "AS IS" BASIS,
  14. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. * See the License for the specific language governing permissions and
  16. * limitations under the License.
  17. */
  18. package org.apache.hadoop.hive.scripts;
  19. import java.io.BufferedReader;
  20. import java.io.InputStreamReader;
  21. import java.util.regex.Matcher;
  22. import java.util.regex.Pattern;
  /**
   * Command-line filter that extracts linked page names from lines of HTML.
   *
   * <p>Each line read from standard input is scanned for anchors of the exact
   * form {@code <a href="http://NAME.html">link</a>} (matched case-insensitively,
   * where NAME is one or more word characters). For every anchor found, the
   * captured {@code NAME.html} is written to standard output followed by a tab
   * and the literal {@code 1}, one record per line.
   *
   * <p>NOTE(review): presumably used as a streaming script by Hive query tests
   * (it lives in the {@code scripts} test package) -- confirm against callers.
   */
  public final class extracturl {

    /**
     * Anchor matcher; capture group 1 is the page name including the
     * {@code .html} suffix. Compiled once because it is reused for every line.
     */
    protected static final Pattern pattern = Pattern.compile(
        "<a href=\"http://([\\w\\d]+\\.html)\">link</a>",
        Pattern.CASE_INSENSITIVE);

    /**
     * Decodes standard input as UTF-8 explicitly rather than with the
     * platform-default charset, so decoding does not vary with the host JVM's
     * locale settings. The charset is referenced by its fully qualified name so
     * the file's import list does not need to change.
     */
    static InputStreamReader converter = new InputStreamReader(
        System.in, java.nio.charset.Charset.forName("UTF-8"));

    /** Line-oriented view of {@link #converter}; this is what {@code main} reads. */
    static BufferedReader in = new BufferedReader(converter);

    /**
     * Reads standard input until end of stream and prints one
     * {@code NAME.html<TAB>1} record per matching anchor. A single input line
     * may produce several records, and lines without a match produce none.
     *
     * <p>Any exception raised while reading or matching is printed to standard
     * error and the JVM exits with status 1.
     *
     * @param args command-line arguments; not used
     */
    public static void main(String[] args) {
      String input;
      try {
        while ((input = in.readLine()) != null) {
          Matcher m = pattern.matcher(input);
          // find() resumes after the previous match, so every anchor on the
          // line is reported, not just the first one.
          while (m.find()) {
            // group(1) is the text between start(1) and end(1).
            String url = m.group(1);
            System.out.println(url + "\t" + "1");
          }
        }
      } catch (Exception e) {
        e.printStackTrace();
        System.exit(1);
      }
    }

    private extracturl() {
      // prevent instantiation
    }
  }