backup.go 8.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323
  1. // Copyright 2022 The Gogs Authors. All rights reserved.
  2. // Use of this source code is governed by a MIT-style
  3. // license that can be found in the LICENSE and LICENSE.gogs file.
  4. // Copyright 2025 Huan-Gogs Authors. All rights reserved.
  5. // Use of this source code is governed by a MIT-style
  6. // license that can be found in the LICENSE file.
  7. package database
  8. import (
  9. "bufio"
  10. "bytes"
  11. "context"
  12. "fmt"
  13. "io"
  14. "os"
  15. "path/filepath"
  16. "reflect"
  17. "strings"
  18. "sync"
  19. jsoniter "github.com/json-iterator/go"
  20. "github.com/pkg/errors"
  21. "gorm.io/gorm"
  22. "gorm.io/gorm/schema"
  23. log "unknwon.dev/clog/v2"
  24. "xorm.io/core"
  25. "xorm.io/xorm"
  26. "github.com/SongZihuan/huan-gogs/internal/conf"
  27. "github.com/SongZihuan/huan-gogs/internal/osutil"
  28. )
  29. // getTableType returns the type name of a table definition without package name,
  30. // e.g. *database.LFSObject -> LFSObject.
  31. func getTableType(t any) string {
  32. return strings.TrimPrefix(fmt.Sprintf("%T", t), "*database.")
  33. }
  34. // DumpDatabase dumps all data from database to file system in JSON Lines format.
  35. func DumpDatabase(ctx context.Context, db *gorm.DB, dirPath string, verbose bool) error {
  36. err := os.MkdirAll(dirPath, os.ModePerm)
  37. if err != nil {
  38. return err
  39. }
  40. err = dumpLegacyTables(ctx, dirPath, verbose)
  41. if err != nil {
  42. return errors.Wrap(err, "dump legacy tables")
  43. }
  44. for _, table := range Tables {
  45. select {
  46. case <-ctx.Done():
  47. return ctx.Err()
  48. default:
  49. }
  50. tableName := getTableType(table)
  51. if verbose {
  52. log.Trace("Dumping table %q...", tableName)
  53. }
  54. err := func() error {
  55. tableFile := filepath.Join(dirPath, tableName+".json")
  56. f, err := os.Create(tableFile)
  57. if err != nil {
  58. return errors.Wrap(err, "create table file")
  59. }
  60. defer func() { _ = f.Close() }()
  61. return dumpTable(ctx, db, table, f)
  62. }()
  63. if err != nil {
  64. return errors.Wrapf(err, "dump table %q", tableName)
  65. }
  66. }
  67. return nil
  68. }
  69. func dumpTable(ctx context.Context, db *gorm.DB, table any, w io.Writer) error {
  70. query := db.WithContext(ctx).Model(table)
  71. switch table.(type) {
  72. case *LFSObject:
  73. query = query.Order("repo_id, oid ASC")
  74. default:
  75. query = query.Order("id ASC")
  76. }
  77. rows, err := query.Rows()
  78. if err != nil {
  79. return errors.Wrap(err, "select rows")
  80. }
  81. defer func() { _ = rows.Close() }()
  82. for rows.Next() {
  83. elem := reflect.New(reflect.TypeOf(table).Elem()).Interface()
  84. err = db.ScanRows(rows, elem)
  85. if err != nil {
  86. return errors.Wrap(err, "scan rows")
  87. }
  88. switch e := elem.(type) {
  89. case *LFSObject:
  90. e.CreatedAt = e.CreatedAt.UTC()
  91. }
  92. err = jsoniter.NewEncoder(w).Encode(elem)
  93. if err != nil {
  94. return errors.Wrap(err, "encode JSON")
  95. }
  96. }
  97. return rows.Err()
  98. }
  99. func dumpLegacyTables(ctx context.Context, dirPath string, verbose bool) error {
  100. // Purposely create a local variable to not modify global variable
  101. legacyTables := append(legacyTables, new(Version))
  102. for _, table := range legacyTables {
  103. select {
  104. case <-ctx.Done():
  105. return ctx.Err()
  106. default:
  107. }
  108. tableName := getTableType(table)
  109. if verbose {
  110. log.Trace("Dumping table %q...", tableName)
  111. }
  112. tableFile := filepath.Join(dirPath, tableName+".json")
  113. f, err := os.Create(tableFile)
  114. if err != nil {
  115. return fmt.Errorf("create JSON file: %v", err)
  116. }
  117. if err = x.Context(ctx).Asc("id").Iterate(table, func(idx int, bean any) (err error) {
  118. return jsoniter.NewEncoder(f).Encode(bean)
  119. }); err != nil {
  120. _ = f.Close()
  121. return fmt.Errorf("dump table '%s': %v", tableName, err)
  122. }
  123. _ = f.Close()
  124. }
  125. return nil
  126. }
  127. // ImportDatabase imports data from backup archive in JSON Lines format.
  128. func ImportDatabase(ctx context.Context, db *gorm.DB, dirPath string, verbose bool) error {
  129. err := importLegacyTables(ctx, dirPath, verbose)
  130. if err != nil {
  131. return errors.Wrap(err, "import legacy tables")
  132. }
  133. for _, table := range Tables {
  134. select {
  135. case <-ctx.Done():
  136. return ctx.Err()
  137. default:
  138. }
  139. tableName := strings.TrimPrefix(fmt.Sprintf("%T", table), "*database.")
  140. err := func() error {
  141. tableFile := filepath.Join(dirPath, tableName+".json")
  142. if !osutil.IsFile(tableFile) {
  143. log.Info("Skipped table %q", tableName)
  144. return nil
  145. }
  146. if verbose {
  147. log.Trace("Importing table %q...", tableName)
  148. }
  149. f, err := os.Open(tableFile)
  150. if err != nil {
  151. return errors.Wrap(err, "open table file")
  152. }
  153. defer func() { _ = f.Close() }()
  154. return importTable(ctx, db, table, f)
  155. }()
  156. if err != nil {
  157. return errors.Wrapf(err, "import table %q", tableName)
  158. }
  159. }
  160. return nil
  161. }
  162. func importTable(ctx context.Context, db *gorm.DB, table any, r io.Reader) error {
  163. err := db.WithContext(ctx).Migrator().DropTable(table)
  164. if err != nil {
  165. return errors.Wrap(err, "drop table")
  166. }
  167. err = db.WithContext(ctx).Migrator().AutoMigrate(table)
  168. if err != nil {
  169. return errors.Wrap(err, "auto migrate")
  170. }
  171. s, err := schema.Parse(table, &sync.Map{}, db.NamingStrategy)
  172. if err != nil {
  173. return errors.Wrap(err, "parse schema")
  174. }
  175. rawTableName := s.Table
  176. skipResetIDSeq := map[string]bool{
  177. "lfs_object": true,
  178. }
  179. scanner := bufio.NewScanner(r)
  180. for scanner.Scan() {
  181. // PostgreSQL does not like the null characters (U+0000)
  182. cleaned := bytes.ReplaceAll(scanner.Bytes(), []byte("\\u0000"), []byte(""))
  183. elem := reflect.New(reflect.TypeOf(table).Elem()).Interface()
  184. err = jsoniter.Unmarshal(cleaned, elem)
  185. if err != nil {
  186. return errors.Wrap(err, "unmarshal JSON to struct")
  187. }
  188. err = db.WithContext(ctx).Create(elem).Error
  189. if err != nil {
  190. return errors.Wrap(err, "create row")
  191. }
  192. }
  193. // PostgreSQL needs manually reset table sequence for auto increment keys
  194. if conf.UsePostgreSQL && !skipResetIDSeq[rawTableName] {
  195. seqName := rawTableName + "_id_seq"
  196. if err = db.WithContext(ctx).Exec(fmt.Sprintf(`SELECT setval('%s', COALESCE((SELECT MAX(id)+1 FROM "%s"), 1), false)`, seqName, rawTableName)).Error; err != nil {
  197. return errors.Wrapf(err, "reset table %q.%q", rawTableName, seqName)
  198. }
  199. }
  200. return nil
  201. }
  202. func importLegacyTables(ctx context.Context, dirPath string, verbose bool) error {
  203. snakeMapper := core.SnakeMapper{}
  204. skipInsertProcessors := map[string]bool{
  205. "mirror": true,
  206. "milestone": true,
  207. }
  208. // Purposely create a local variable to not modify global variable
  209. legacyTables := append(legacyTables, new(Version))
  210. for _, table := range legacyTables {
  211. select {
  212. case <-ctx.Done():
  213. return ctx.Err()
  214. default:
  215. }
  216. tableName := strings.TrimPrefix(fmt.Sprintf("%T", table), "*database.")
  217. tableFile := filepath.Join(dirPath, tableName+".json")
  218. if !osutil.IsFile(tableFile) {
  219. continue
  220. }
  221. if verbose {
  222. log.Trace("Importing table %q...", tableName)
  223. }
  224. if err := x.DropTables(table); err != nil {
  225. return fmt.Errorf("drop table %q: %v", tableName, err)
  226. } else if err = x.Sync2(table); err != nil {
  227. return fmt.Errorf("sync table %q: %v", tableName, err)
  228. }
  229. f, err := os.Open(tableFile)
  230. if err != nil {
  231. return fmt.Errorf("open JSON file: %v", err)
  232. }
  233. rawTableName := x.TableName(table)
  234. _, isInsertProcessor := table.(xorm.BeforeInsertProcessor)
  235. scanner := bufio.NewScanner(f)
  236. for scanner.Scan() {
  237. if err = jsoniter.Unmarshal(scanner.Bytes(), table); err != nil {
  238. return fmt.Errorf("unmarshal to struct: %v", err)
  239. }
  240. if _, err = x.Insert(table); err != nil {
  241. return fmt.Errorf("insert strcut: %v", err)
  242. }
  243. var meta struct {
  244. ID int64
  245. CreatedUnix int64
  246. DeadlineUnix int64
  247. ClosedDateUnix int64
  248. }
  249. if err = jsoniter.Unmarshal(scanner.Bytes(), &meta); err != nil {
  250. log.Error("Failed to unmarshal to map: %v", err)
  251. }
  252. // Reset created_unix back to the date save in archive because Insert method updates its value
  253. if isInsertProcessor && !skipInsertProcessors[rawTableName] {
  254. if _, err = x.Exec("UPDATE `"+rawTableName+"` SET created_unix=? WHERE id=?", meta.CreatedUnix, meta.ID); err != nil {
  255. log.Error("Failed to reset '%s.created_unix': %v", rawTableName, err)
  256. }
  257. }
  258. switch rawTableName {
  259. case "milestone":
  260. if _, err = x.Exec("UPDATE `"+rawTableName+"` SET deadline_unix=?, closed_date_unix=? WHERE id=?", meta.DeadlineUnix, meta.ClosedDateUnix, meta.ID); err != nil {
  261. log.Error("Failed to reset 'milestone.deadline_unix', 'milestone.closed_date_unix': %v", err)
  262. }
  263. }
  264. }
  265. // PostgreSQL needs manually reset table sequence for auto increment keys
  266. if conf.UsePostgreSQL {
  267. rawTableName := snakeMapper.Obj2Table(tableName)
  268. seqName := rawTableName + "_id_seq"
  269. if _, err = x.Exec(fmt.Sprintf(`SELECT setval('%s', COALESCE((SELECT MAX(id)+1 FROM "%s"), 1), false);`, seqName, rawTableName)); err != nil {
  270. return fmt.Errorf("reset table %q' sequence: %v", rawTableName, err)
  271. }
  272. }
  273. }
  274. return nil
  275. }