txtreader.go 1.7 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879
  1. package reader
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "io"
  6. "regexp"
  7. "strings"
  8. "git.wecise.com/wecise/cgimport/schema"
  9. )
  10. type TXTBlockReader struct {
  11. *LineReader
  12. filetype schema.FileType
  13. firstline string
  14. nextline string
  15. }
  16. func NewTXTBlockReader(filename string, filetype schema.FileType, reader io.Reader) *TXTBlockReader {
  17. return &TXTBlockReader{
  18. LineReader: NewLineReader(filename, reader),
  19. filetype: filetype,
  20. }
  21. }
  22. var regrecordstart = regexp.MustCompile(`^(?:[\.\/a-zA-Z0-9_]*:)?V:(\{.*)`)
  23. var regrecordend = regexp.MustCompile(`\}\s*$`)
  24. func (br *TXTBlockReader) ReadBlock(skiplines int) (block map[string]any, line string, linecount int, err error) {
  25. eof := false
  26. line = br.nextline
  27. for {
  28. for {
  29. br.nextline, linecount, eof, err = br.ReadLine()
  30. if err != nil {
  31. return
  32. }
  33. if br.nextline == "" && eof {
  34. if line == "" {
  35. return
  36. }
  37. break
  38. }
  39. if linecount <= skiplines {
  40. continue
  41. }
  42. if regrecordend.MatchString(line) {
  43. break
  44. }
  45. if regrecordstart.MatchString(br.nextline) {
  46. break
  47. }
  48. line += br.nextline
  49. }
  50. linecount--
  51. if !regrecordstart.MatchString(line) || !regrecordend.MatchString(line) {
  52. if line != "" {
  53. logger.Info(fmt.Sprint("skip non-json line ", br.filename, ":", linecount, " ", line))
  54. }
  55. if linecount == 1 {
  56. br.firstline = line
  57. }
  58. line = br.nextline
  59. continue
  60. }
  61. line = regrecordstart.ReplaceAllString(line, "$1")
  62. line = strings.ReplaceAll(line, `\`, `\\`)
  63. line = strings.ReplaceAll(line, "\t", `\t`)
  64. line = strings.ReplaceAll(line, "\r", `\r`)
  65. line = strings.ReplaceAll(line, "\n", `\n`)
  66. block = map[string]any{}
  67. err = json.Unmarshal([]byte(line), &block)
  68. if err != nil {
  69. return
  70. }
  71. return
  72. }
  73. }