Refactor probe locking into shared functions

For scripts with thousands of probes, we save a fair amount of code-gen time in pass-4 by having the common locking code extracted into shared functions. * runtime/probe_lock.h (stp_lock_probe, stp_unlock_probe): New. * translate.cxx (c_unparser::emit_lock_decls): New, emits a static const array of locks needed for each probe. (c_unparser::emit_locks): Just call stp_lock_probe. (c_unparser::emit_unlocks): Just call stp_unlock_probe.
author: Josh Stone <jistone@redhat.com> 2009-10-21 16:15:58 -0700
committer: Josh Stone <jistone@redhat.com> 2009-10-21 16:36:25 -0700
commit: 29bb0bbc8603edb20de09e79fd8addb4a174947d (patch)
tree: 2d39d41b9479c87839e22b9a9c81a4830d315377 /translate.cxx
parent: 1d2cd5ff6a8ff79b09e342a5907b29b4c340a9a5 (diff)
download: systemtap-steved-29bb0bbc8603edb20de09e79fd8addb4a174947d.tar.gz
systemtap-steved-29bb0bbc8603edb20de09e79fd8addb4a174947d.tar.xz
systemtap-steved-29bb0bbc8603edb20de09e79fd8addb4a174947d.zip
1 files changed, 44 insertions, 89 deletions
diff --git a/translate.cxx b/translate.cxx
index 1109449d..ed415abb 100644
--- a/translate.cxx
+++ b/translate.cxx
@@ -73,6 +73,7 @@ struct c_unparser: public unparser, public visitor
   void emit_module_init ();
   void emit_module_exit ();
   void emit_function (functiondecl* v);
+  void emit_lock_decls (const varuse_collecting_visitor& v);
   void emit_locks (const varuse_collecting_visitor& v);
   void emit_probe (derived_probe* v);
   void emit_unlocks (const varuse_collecting_visitor& v);
@@ -1622,6 +1623,14 @@ c_unparser::emit_probe (derived_probe* v)
 
       probe_contents[oss.str()] = v->name;
 
+      // emit static read/write lock decls for global variables
+      varuse_collecting_visitor vut(*session);
+      if (v->needs_global_locks ())
+        {
+	  v->body->visit (& vut);
+	  emit_lock_decls (vut);
+	}
+
       // initialize frame pointer
       o->newline() << "struct " << v->name << "_locals * __restrict__ l =";
       o->newline(1) << "& c->probe_locals." << v->name << ";";
@@ -1638,12 +1647,8 @@ c_unparser::emit_probe (derived_probe* v)
       v->emit_probe_local_init(o);
 
       // emit all read/write locks for global variables
-      varuse_collecting_visitor vut(*session);
       if (v->needs_global_locks ())
-        {
-	  v->body->visit (& vut);
 	  emit_locks (vut);
-	}
 
       // initialize locals
       for (unsigned j=0; j<v->locals.size(); j++)
@@ -1694,13 +1699,16 @@ c_unparser::emit_probe (derived_probe* v)
 
 
 void
-c_unparser::emit_locks(const varuse_collecting_visitor& vut)
+c_unparser::emit_lock_decls(const varuse_collecting_visitor& vut)
 {
-  o->newline() << "{";
-  o->newline(1) << "unsigned numtrylock = 0;";
-  o->newline() << "(void) numtrylock;";
+  unsigned numvars = 0;
+
+  if (session->verbose > 1)
+    clog << current_probe->name << " locks ";
+
+  o->newline() << "static const struct stp_probe_lock locks[] = {";
+  o->indent(1);
 
-  string last_locked_var;
   for (unsigned i = 0; i < session->globals.size(); i++)
     {
       vardecl* v = session->globals[i];
@@ -1732,94 +1740,44 @@ c_unparser::emit_locks(const varuse_collecting_visitor& vut)
 	    continue;
 	}
 
-      string lockcall =
-        string (write_p ? "write" : "read") +
-        "_trylock (& global.s_" + v->name + "_lock)";
-
-      o->newline() << "while (! " << lockcall
-                   << "&& (++numtrylock < MAXTRYLOCK))";
-      o->newline(1) << "ndelay (TRYLOCKDELAY);";
-      o->newline(-1) << "if (unlikely (numtrylock >= MAXTRYLOCK)) {";
-      o->newline(1) << "atomic_inc (& skipped_count);";
+      o->newline() << "{";
+      o->newline(1) << ".lock = &global.s_" + v->name + "_lock,";
+      o->newline() << ".write_p = " << (write_p ? 1 : 0) << ",";
       o->newline() << "#ifdef STP_TIMING";
-      o->newline() << "atomic_inc (& global.s_" << c_varname (v->name) << "_lock_skip_count);";
+      o->newline() << ".skipped = &global.s_" << c_varname (v->name) << "_lock_skip_count,";
       o->newline() << "#endif";
-      // The following works even if i==0.  Note that using
-      // globals[i-1]->name is wrong since that global may not have
-      // been lockworthy by this probe.
-      o->newline() << "goto unlock_" << last_locked_var << ";";
-      o->newline(-1) << "}";
+      o->newline(-1) << "},";
 
-      last_locked_var = v->name;
+      numvars ++;
+      if (session->verbose > 1)
+        clog << v->name << "[" << (read_p ? "r" : "")
+             << (write_p ? "w" : "")  << "] ";
     }
 
-  o->newline() << "if (0) goto unlock_;";
+  o->newline(-1) << "};";
 
-  o->newline(-1) << "}";
+  if (session->verbose > 1)
+    {
+      if (!numvars)
+        clog << "nothing";
+      clog << endl;
+    }
 }
 
 
 void
-c_unparser::emit_unlocks(const varuse_collecting_visitor& vut)
+c_unparser::emit_locks(const varuse_collecting_visitor&)
 {
-  unsigned numvars = 0;
-
-  if (session->verbose>1)
-    clog << current_probe->name << " locks ";
-
-  for (int i = session->globals.size()-1; i>=0; i--) // in reverse order!
-    {
-      vardecl* v = session->globals[i];
-      bool read_p = vut.read.find(v) != vut.read.end();
-      bool write_p = vut.written.find(v) != vut.written.end();
-      if (!read_p && !write_p) continue;
-
-      // Duplicate lock flipping logic from above
-      if (v->type == pe_stats)
-        {
-          if (write_p && !read_p) { read_p = true; write_p = false; }
-          else if (read_p && !write_p) { read_p = false; write_p = true; }
-        }
-
-      // Duplicate "read-mostly" global variable logic from above.
-      if (read_p && !write_p)
-        {
-	  if (vcv_needs_global_locks.written.find(v)
-	      == vcv_needs_global_locks.written.end())
-	    continue;
-	}
-
-      numvars ++;
-      o->newline(-1) << "unlock_" << v->name << ":";
-      o->indent(1);
-
-      if (session->verbose>1)
-        clog << v->name << "[" << (read_p ? "r" : "")
-             << (write_p ? "w" : "")  << "] ";
-
-      if (write_p) // emit write lock
-        o->newline() << "write_unlock (& global.s_" << v->name << "_lock);";
-      else // (read_p && !write_p) : emit read lock
-        o->newline() << "read_unlock (& global.s_" << v->name << "_lock);";
-
-      // fall through to next variable; thus the reverse ordering
-    }
+  o->newline() << "if (!stp_lock_probe(locks, ARRAY_SIZE(locks)))";
+  o->newline(1) << "return;";
+  o->indent(-1);
+}
 
-  // emit plain "unlock" label, used if the very first lock failed.
-  o->newline(-1) << "unlock_: ;";
-  o->indent(1);
 
-  if (numvars) // is there a chance that any lock attempt failed?
-    {
-      // Formerly, we checked skipped_count > MAXSKIPPED here, and set
-      // SYSTEMTAP_SESSION_ERROR if so.  But now, this check is shared
-      // via common_probe_entryfn_epilogue().
-
-      if (session->verbose>1)
-        clog << endl;
-    }
-  else if (session->verbose>1)
-    clog << "nothing" << endl;
+void
+c_unparser::emit_unlocks(const varuse_collecting_visitor& vut)
+{
+  o->newline() << "stp_unlock_probe(locks, ARRAY_SIZE(locks));";
 }
 
 
@@ -5233,13 +5191,10 @@ translate_pass (systemtap_session& s)
       s.op->newline() << "#include \"loc2c-runtime.h\" ";
       s.op->newline() << "#include \"access_process_vm.h\" ";
 
-      // XXX: old 2.6 kernel hack
-      s.op->newline() << "#ifndef read_trylock";
-      s.op->newline() << "#define read_trylock(x) ({ read_lock(x); 1; })";
-      s.op->newline() << "#endif";
-
       s.up->emit_common_header (); // context etc.
 
+      s.op->newline() << "#include \"probe_lock.h\" ";
+
       for (unsigned i=0; i<s.embeds.size(); i++)
         {
           s.op->newline() << s.embeds[i]->code << "\n";
author	Josh Stone <jistone@redhat.com>	2009-10-21 16:15:58 -0700
committer	Josh Stone <jistone@redhat.com>	2009-10-21 16:36:25 -0700
commit	29bb0bbc8603edb20de09e79fd8addb4a174947d (patch)
tree	2d39d41b9479c87839e22b9a9c81a4830d315377 /translate.cxx
parent	1d2cd5ff6a8ff79b09e342a5907b29b4c340a9a5 (diff)
download	systemtap-steved-29bb0bbc8603edb20de09e79fd8addb4a174947d.tar.gz systemtap-steved-29bb0bbc8603edb20de09e79fd8addb4a174947d.tar.xz systemtap-steved-29bb0bbc8603edb20de09e79fd8addb4a174947d.zip